|
@ -0,0 +1,93 @@ |
|
|
|
|
|
from __future__ import unicode_literals |
|
|
|
|
|
from .common import InfoExtractor |
|
|
|
|
|
from .common import ExtractorError |
|
|
|
|
|
import json |
|
|
|
|
|
import re |
|
|
|
|
|
from ..utils import int_or_none |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CamModelsIE(InfoExtractor): |
|
|
|
|
|
_VALID_URL = r'https?://(?:www\.)?cammodels\.com/cam/(?P<id>\w+)' |
|
|
|
|
|
_HEADERS = { |
|
|
|
|
|
'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.2704.103 Safari/537.36' |
|
|
|
|
|
# Needed because server doesn't return links to video URLs if a browser-like User-Agent is not used |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
def _real_extract(self, url): |
|
|
|
|
|
video_id = self._match_id(url) |
|
|
|
|
|
webpage = self._download_webpage( |
|
|
|
|
|
url, |
|
|
|
|
|
video_id, |
|
|
|
|
|
headers=self._HEADERS) |
|
|
|
|
|
manifest_url_root = self._html_search_regex( |
|
|
|
|
|
r'manifestUrlRoot=(?P<id>https?:\/\/(www\.)?[-a-zA-Z0-9@:%._\+~#=]{2,256}\.[a-z]{2,6}\b([-a-zA-Z0-9@:%_\+.~#?&//=]*))', |
|
|
|
|
|
webpage, |
|
|
|
|
|
'manifest', |
|
|
|
|
|
None, |
|
|
|
|
|
False) |
|
|
|
|
|
if not manifest_url_root: |
|
|
|
|
|
offline = self._html_search_regex( |
|
|
|
|
|
r'(?P<id>I\'m offline, but let\'s stay connected!)', |
|
|
|
|
|
webpage, |
|
|
|
|
|
'offline indicator', |
|
|
|
|
|
None, |
|
|
|
|
|
False) |
|
|
|
|
|
private = self._html_search_regex( |
|
|
|
|
|
r'(?P<id>I’m in a private show right now)', |
|
|
|
|
|
webpage, |
|
|
|
|
|
'private show indicator', |
|
|
|
|
|
None, |
|
|
|
|
|
False) |
|
|
|
|
|
err = 'This user is currently offline, so nothing can be downloaded.' if offline \ |
|
|
|
|
|
else 'This user is doing a private show, which requires payment. This extractor currently does not support private streams.' if private \ |
|
|
|
|
|
else 'Unable to find link to stream info on webpage. Room is not offline, so something else is wrong.' |
|
|
|
|
|
raise ExtractorError( |
|
|
|
|
|
err, |
|
|
|
|
|
expected=True if offline or private else False, |
|
|
|
|
|
video_id=video_id |
|
|
|
|
|
) |
|
|
|
|
|
manifest_url = manifest_url_root + video_id + '.json' |
|
|
|
|
|
manifest = self._download_json( |
|
|
|
|
|
manifest_url, |
|
|
|
|
|
video_id, |
|
|
|
|
|
'Downloading links to streams.', |
|
|
|
|
|
'Link to stream URLs was found, but we couldn\'t access it.', |
|
|
|
|
|
headers=self._HEADERS) |
|
|
|
|
|
try: |
|
|
|
|
|
formats = [] |
|
|
|
|
|
for fmtName in ['mp4-rtmp', 'mp4-hls']: |
|
|
|
|
|
for encoding in manifest['formats'][fmtName]['encodings']: |
|
|
|
|
|
formats.append({ |
|
|
|
|
|
'ext': 'mp4', |
|
|
|
|
|
'url': encoding['location'], |
|
|
|
|
|
'width': int_or_none(encoding.get('videoWidth')), |
|
|
|
|
|
'height': int_or_none(encoding.get('videoHeight')), |
|
|
|
|
|
'vbr': int_or_none(encoding.get('videoKbps')), |
|
|
|
|
|
'abr': int_or_none(encoding.get('audioKbps')), |
|
|
|
|
|
'format_id': fmtName + str(encoding.get('videoWidth')) |
|
|
|
|
|
}) |
|
|
|
|
|
# If they change the JSON format, then fallback to parsing out RTMP links via regex. |
|
|
|
|
|
except KeyError: |
|
|
|
|
|
manifest_json = json.dumps(manifest) |
|
|
|
|
|
manifest_links = re.finditer( |
|
|
|
|
|
r'(?P<id>rtmp?:\/\/[-a-zA-Z0-9@:%._\+~#=]{2,256}\.[a-z]{2,6}\b([-a-zA-Z0-9@:%_\+.~#&//=]*))', |
|
|
|
|
|
manifest_json) |
|
|
|
|
|
if not manifest_links: |
|
|
|
|
|
raise ExtractorError( |
|
|
|
|
|
'Link to stream info was found, but we couldn\'t read the response. This is probably a bug.', |
|
|
|
|
|
expected=False, |
|
|
|
|
|
video_id=video_id) |
|
|
|
|
|
formats = [] |
|
|
|
|
|
for manifest_link in manifest_links: |
|
|
|
|
|
url = manifest_link.group('id') |
|
|
|
|
|
formats.append({ |
|
|
|
|
|
'ext': 'mp4', |
|
|
|
|
|
'url': url, |
|
|
|
|
|
'format_id': url.split(sep='/')[-1] |
|
|
|
|
|
}) |
|
|
|
|
|
self._sort_formats(formats) |
|
|
|
|
|
return { |
|
|
|
|
|
'id': video_id, |
|
|
|
|
|
'title': self._live_title(video_id), |
|
|
|
|
|
'formats': formats |
|
|
|
|
|
} |