zolfa
/
youtube-dl

# coding: utf-8
from __future__ import unicode_literals

from .common import InfoExtractor
from ..utils import remove_end

class BioBioChileTVIE(InfoExtractor):
    """Extractor for video notes published on tv.biobiochile.cl.

    Matches ``/notas/<path...>/<slug>.shtml`` pages; the slug (the last path
    component without the ``.shtml`` suffix) is used as the video id.
    """

    _VALID_URL = r'https?://tv\.biobiochile\.cl/notas/(?:[^/]+/)+(?P<id>[^/]+)\.shtml'
    _TESTS = [{
        'url': 'http://tv.biobiochile.cl/notas/2015/10/21/sobre-camaras-y-camarillas-parlamentarias.shtml',
        'md5': '26f51f03cf580265defefb4518faec09',
        'info_dict': {
            'id': 'sobre-camaras-y-camarillas-parlamentarias',
            'ext': 'mp4',
            'title': 'Sobre Cámaras y camarillas parlamentarias',
            # Raw string: '\.' is an invalid escape in a normal literal.
            'thumbnail': r're:^https?://.*\.jpg$',
            'uploader': 'Fernando Atria',
        },
    }, {
        # different uploader layout
        'url': 'http://tv.biobiochile.cl/notas/2016/03/18/natalia-valdebenito-repasa-a-diputado-hasbun-paso-a-la-categoria-de-hablar-brutalidades.shtml',
        'md5': 'edc2e6b58974c46d5b047dea3c539ff3',
        'info_dict': {
            'id': 'natalia-valdebenito-repasa-a-diputado-hasbun-paso-a-la-categoria-de-hablar-brutalidades',
            'ext': 'mp4',
            'title': 'Natalia Valdebenito repasa a diputado Hasbún: Pasó a la categoría de hablar brutalidades',
            'thumbnail': r're:^https?://.*\.jpg$',
            'uploader': 'Piangella Obrador',
        },
        'params': {
            'skip_download': True,
        },
    }, {
        'url': 'http://tv.biobiochile.cl/notas/2015/10/22/ninos-transexuales-de-quien-es-la-decision.shtml',
        'only_matching': True,
    }, {
        'url': 'http://tv.biobiochile.cl/notas/2015/10/21/exclusivo-hector-pinto-formador-de-chupete-revela-version-del-ex-delantero-albo.shtml',
        'only_matching': True,
    }]

    def _real_extract(self, url):
        """Build the info dict for a single note page.

        Returns a dict with ``id``, ``title``, ``thumbnail``, ``uploader``
        and ``formats`` (the HLS variants, when available, plus one direct
        HTTP format).
        """
        video_id = self._match_id(url)

        webpage = self._download_webpage(url, video_id)

        # The Open Graph title carries a site suffix; strip it.
        title = remove_end(self._og_search_title(webpage), ' - BioBioChile TV')

        # Second (quoted) argument of the page's loadFWPlayerVideo(...) call.
        file_url = self._search_regex(
            r'loadFWPlayerVideo\([^,]+,\s*(["\'])(?P<url>.+?)\1',
            webpage, 'file url', group='url')

        # Quoted prefix that the page concatenates with `fileURL` in the
        # player's `file:` setting; fall back to a fixed host if not found.
        base_url = self._search_regex(
            r'file\s*:\s*(["\'])(?P<url>.+?)\1\s*\+\s*fileURL', webpage,
            'base url', default='http://unlimited2-cl.digitalproserver.com/bbtv/',
            group='url')

        media_url = '%s%s' % (base_url, file_url)

        # HLS is optional (fatal=False): a failure here must not abort the
        # extraction because the direct HTTP format is still appended below.
        formats = self._extract_m3u8_formats(
            '%s/playlist.m3u8' % media_url, video_id, 'mp4',
            entry_protocol='m3u8_native', m3u8_id='hls', fatal=False)

        http_format = {
            'url': media_url,
            'format_id': 'http',
            'protocol': 'http',
            'preference': 1,
        }
        if formats:
            # Inherit the remaining metadata from the last HLS entry, then
            # override the HTTP-specific fields.
            # NOTE(review): presumably the last entry is the best variant --
            # confirm against _extract_m3u8_formats ordering.
            inherited = formats[-1].copy()
            inherited.update(http_format)
            http_format = inherited
        formats.append(http_format)
        self._sort_formats(formats)

        thumbnail = self._og_search_thumbnail(webpage)

        # Uploader is the text of the link to the author's search page;
        # non-fatal so a missing link does not abort the extraction.
        uploader = self._html_search_regex(
            r'<a[^>]+href=["\']https?://busca\.biobiochile\.cl/author[^>]+>(.+?)</a>',
            webpage, 'uploader', fatal=False)

        return {
            'id': video_id,
            'title': title,
            'thumbnail': thumbnail,
            'uploader': uploader,
            'formats': formats,
        }