|
|
@ -15,6 +15,7 @@ import email.utils |
|
|
|
import gzip |
|
|
|
import htmlentitydefs |
|
|
|
import httplib |
|
|
|
import json # TODO: json for 2.5 |
|
|
|
import locale |
|
|
|
import math |
|
|
|
import netrc |
|
|
@ -2563,6 +2564,80 @@ class FacebookIE(InfoExtractor): |
|
|
|
except UnavailableVideoError, err: |
|
|
|
self._downloader.trouble(u'\nERROR: unable to download video') |
|
|
|
|
|
|
|
class BlipTVIE(InfoExtractor): |
|
|
|
"""Information extractor for blip.tv""" |
|
|
|
|
|
|
|
_VALID_URL = r'^(?:https?://)?(?:\w+\.)?blip.tv/(.+)$' |
|
|
|
_URL_EXT = r'^.*\.([a-z0-9]+)$' |
|
|
|
|
|
|
|
@staticmethod |
|
|
|
def suitable(url): |
|
|
|
return (re.match(BlipTVIE._VALID_URL, url) is not None) |
|
|
|
|
|
|
|
def report_download_webpage(self, file_id): |
|
|
|
"""Report webpage download.""" |
|
|
|
self._downloader.to_screen(u'[%s] %s: Downloading webpage' % (self.service_name, file_id)) |
|
|
|
|
|
|
|
def report_extraction(self, file_id): |
|
|
|
"""Report information extraction.""" |
|
|
|
self._downloader.to_screen(u'[%s] %s: Extracting information' % (self.service_name, file_id)) |
|
|
|
|
|
|
|
@property |
|
|
|
def service_name(self): |
|
|
|
return u'blip.tv' |
|
|
|
|
|
|
|
def _simplify_title(self, title): |
|
|
|
res = re.sub(ur'(?u)([^%s]+)' % simple_title_chars, ur'_', title) |
|
|
|
res = res.strip(ur'_') |
|
|
|
return res |
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
mobj = re.match(self._VALID_URL, url) |
|
|
|
if mobj is None: |
|
|
|
self._downloader.trouble(u'ERROR: invalid URL: %s' % url) |
|
|
|
return |
|
|
|
|
|
|
|
json_url = url + ('&' if '?' in url else '?') + 'skin=json&version=2&no_wrap=1' |
|
|
|
request = urllib2.Request(json_url) |
|
|
|
try: |
|
|
|
json_code = urllib2.urlopen(request).read() |
|
|
|
except (urllib2.URLError, httplib.HTTPException, socket.error), err: |
|
|
|
self._downloader.trouble(u'ERROR: unable to download video info webpage: %s' % str(err)) |
|
|
|
return |
|
|
|
try: |
|
|
|
json_data = json.loads(json_code) |
|
|
|
data = json_data['Post'] |
|
|
|
|
|
|
|
upload_date = datetime.datetime.strptime(data['datestamp'], '%m-%d-%y %H:%M%p').strftime('%Y%m%d') |
|
|
|
video_url = data['media']['url'] |
|
|
|
umobj = re.match(self._URL_EXT, video_url) |
|
|
|
if umobj is None: |
|
|
|
raise ValueError('Can not determine filename extension') |
|
|
|
ext = umobj.group(1) |
|
|
|
|
|
|
|
info = { |
|
|
|
'id': data['item_id'], |
|
|
|
'url': video_url, |
|
|
|
'uploader': data['display_name'], |
|
|
|
'upload_date': upload_date, |
|
|
|
'title': data['title'], |
|
|
|
'stitle': self._simplify_title(data['title']), |
|
|
|
'ext': ext, |
|
|
|
'format': data['media']['mimeType'], |
|
|
|
'thumbnail': data['thumbnailUrl'], |
|
|
|
'description': data['description'], |
|
|
|
'player_url': data['embedUrl'] |
|
|
|
} |
|
|
|
except (ValueError,KeyError), err: |
|
|
|
self._downloader.trouble(u'ERROR: unable to parse video information: %s' % str(err)) |
|
|
|
return |
|
|
|
|
|
|
|
try: |
|
|
|
self._downloader.process_info(info) |
|
|
|
except UnavailableVideoError, err: |
|
|
|
self._downloader.trouble(u'\nERROR: unable to download video') |
|
|
|
|
|
|
|
|
|
|
|
class PostProcessor(object): |
|
|
|
"""Post Processor class. |
|
|
|
|
|
|
@ -2911,6 +2986,7 @@ if __name__ == '__main__': |
|
|
|
yahoo_search_ie = YahooSearchIE(yahoo_ie) |
|
|
|
deposit_files_ie = DepositFilesIE() |
|
|
|
facebook_ie = FacebookIE() |
|
|
|
bliptv_ie = BlipTVIE() |
|
|
|
generic_ie = GenericIE() |
|
|
|
|
|
|
|
# File downloader |
|
|
@ -2963,6 +3039,7 @@ if __name__ == '__main__': |
|
|
|
fd.add_info_extractor(yahoo_search_ie) |
|
|
|
fd.add_info_extractor(deposit_files_ie) |
|
|
|
fd.add_info_extractor(facebook_ie) |
|
|
|
fd.add_info_extractor(bliptv_ie) |
|
|
|
|
|
|
|
# This must come last since it's the |
|
|
|
# fallback if none of the others work |
|
|
|