|
|
@ -0,0 +1,101 @@ |
|
|
|
# coding: utf-8 |
|
|
|
from __future__ import unicode_literals |
|
|
|
|
|
|
|
import json |
|
|
|
import re |
|
|
|
|
|
|
|
from .common import InfoExtractor |
|
|
|
from ..utils import ExtractorError |
|
|
|
|
|
|
|
|
|
|
|
class TuneInIE(InfoExtractor): |
|
|
|
_VALID_URL = r'''(?x)https?://(?:www\.)? |
|
|
|
(?: |
|
|
|
tunein\.com/ |
|
|
|
(?: |
|
|
|
radio/.*?-s| |
|
|
|
station/.*?StationId\= |
|
|
|
)(?P<id>[0-9]+) |
|
|
|
|tun\.in/(?P<redirect_id>[A-Za-z0-9]+) |
|
|
|
) |
|
|
|
''' |
|
|
|
|
|
|
|
_INFO_DICT = { |
|
|
|
'id': '34682', |
|
|
|
'title': 'Jazz 24 on 88.5 Jazz24 - KPLU-HD2', |
|
|
|
'ext': 'AAC', |
|
|
|
'thumbnail': 're:^https?://.*\.png$', |
|
|
|
'location': 'Tacoma, WA', |
|
|
|
} |
|
|
|
_TESTS = [ |
|
|
|
{ |
|
|
|
'url': 'http://tunein.com/radio/Jazz24-885-s34682/', |
|
|
|
'info_dict': _INFO_DICT, |
|
|
|
'params': { |
|
|
|
'skip_download': True, # live stream |
|
|
|
}, |
|
|
|
}, |
|
|
|
{ # test redirection |
|
|
|
'url': 'http://tun.in/ser7s', |
|
|
|
'info_dict': _INFO_DICT, |
|
|
|
'params': { |
|
|
|
'skip_download': True, # live stream |
|
|
|
}, |
|
|
|
}, |
|
|
|
] |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
mobj = re.match(self._VALID_URL, url) |
|
|
|
redirect_id = mobj.group('redirect_id') |
|
|
|
if redirect_id: |
|
|
|
# The server doesn't support HEAD requests |
|
|
|
urlh = self._request_webpage( |
|
|
|
url, redirect_id, note='Downloading redirect page') |
|
|
|
url = urlh.geturl() |
|
|
|
self.to_screen('Following redirect: %s' % url) |
|
|
|
mobj = re.match(self._VALID_URL, url) |
|
|
|
station_id = mobj.group('id') |
|
|
|
|
|
|
|
webpage = self._download_webpage( |
|
|
|
url, station_id, note='Downloading station webpage') |
|
|
|
|
|
|
|
payload = self._html_search_regex( |
|
|
|
r'(?m)TuneIn\.payload\s*=\s*(\{[^$]+?)$', webpage, 'JSON data') |
|
|
|
json_data = json.loads(payload) |
|
|
|
station_info = json_data['Station']['broadcast'] |
|
|
|
title = station_info['Title'] |
|
|
|
thumbnail = station_info.get('Logo') |
|
|
|
location = station_info.get('Location') |
|
|
|
streams_url = station_info.get('StreamUrl') |
|
|
|
if not streams_url: |
|
|
|
raise ExtractorError('No downloadable streams found', |
|
|
|
expected=True) |
|
|
|
stream_data = self._download_webpage( |
|
|
|
streams_url, station_id, note='Downloading stream data') |
|
|
|
streams = json.loads(self._search_regex( |
|
|
|
r'\((.*)\);', stream_data, 'stream info'))['Streams'] |
|
|
|
|
|
|
|
is_live = None |
|
|
|
formats = [] |
|
|
|
for stream in streams: |
|
|
|
if stream.get('Type') == 'Live': |
|
|
|
is_live = True |
|
|
|
formats.append({ |
|
|
|
'abr': stream.get('Bandwidth'), |
|
|
|
'ext': stream.get('MediaType'), |
|
|
|
'acodec': stream.get('MediaType'), |
|
|
|
'vcodec': 'none', |
|
|
|
'url': stream.get('Url'), |
|
|
|
# Sometimes streams with the highest quality do not exist |
|
|
|
'preference': stream.get('Reliability'), |
|
|
|
}) |
|
|
|
self._sort_formats(formats) |
|
|
|
|
|
|
|
return { |
|
|
|
'id': station_id, |
|
|
|
'title': title, |
|
|
|
'formats': formats, |
|
|
|
'thumbnail': thumbnail, |
|
|
|
'location': location, |
|
|
|
'is_live': is_live, |
|
|
|
} |