|
|
- # coding: utf-8
- from __future__ import unicode_literals
-
- from .common import InfoExtractor
- from ..compat import compat_str
- from ..utils import (
- float_or_none,
- unified_strdate,
- )
-
-
- class DctpTvIE(InfoExtractor):
- _VALID_URL = r'https?://(?:www\.)?dctp\.tv/(?:#/)?filme/(?P<id>[^/?#&]+)'
- _TEST = {
- 'url': 'http://www.dctp.tv/filme/videoinstallation-fuer-eine-kaufhausfassade/',
- 'info_dict': {
- 'id': '95eaa4f33dad413aa17b4ee613cccc6c',
- 'display_id': 'videoinstallation-fuer-eine-kaufhausfassade',
- 'ext': 'flv',
- 'title': 'Videoinstallation für eine Kaufhausfassade',
- 'description': 'Kurzfilm',
- 'upload_date': '20110407',
- 'thumbnail': r're:^https?://.*\.jpg$',
- 'duration': 71.24,
- },
- 'params': {
- # rtmp download
- 'skip_download': True,
- },
- }
-
- def _real_extract(self, url):
- display_id = self._match_id(url)
-
- webpage = self._download_webpage(url, display_id)
-
- video_id = self._html_search_meta(
- 'DC.identifier', webpage, 'video id',
- default=None) or self._search_regex(
- r'id=["\']uuid[^>]+>([^<]+)<', webpage, 'video id')
-
- title = self._og_search_title(webpage)
-
- servers = self._download_json(
- 'http://www.dctp.tv/streaming_servers/', display_id,
- note='Downloading server list', fatal=False)
-
- if servers:
- endpoint = next(
- server['endpoint']
- for server in servers
- if isinstance(server.get('endpoint'), compat_str) and
- 'cloudfront' in server['endpoint'])
- else:
- endpoint = 'rtmpe://s2pqqn4u96e4j8.cloudfront.net/cfx/st/'
-
- app = self._search_regex(
- r'^rtmpe?://[^/]+/(?P<app>.*)$', endpoint, 'app')
-
- formats = [{
- 'url': endpoint,
- 'app': app,
- 'play_path': 'mp4:%s_dctp_0500_4x3.m4v' % video_id,
- 'page_url': url,
- 'player_url': 'http://svm-prod-dctptv-static.s3.amazonaws.com/dctptv-relaunch2012-109.swf',
- 'ext': 'flv',
- }]
-
- description = self._html_search_meta('DC.description', webpage)
- upload_date = unified_strdate(
- self._html_search_meta('DC.date.created', webpage))
- thumbnail = self._og_search_thumbnail(webpage)
- duration = float_or_none(self._search_regex(
- r'id=["\']duration_in_ms[^+]>(\d+)', webpage, 'duration',
- default=None), scale=1000)
-
- return {
- 'id': video_id,
- 'title': title,
- 'formats': formats,
- 'display_id': display_id,
- 'description': description,
- 'upload_date': upload_date,
- 'thumbnail': thumbnail,
- 'duration': duration,
- }
|