Browse Source

[imdb] Fix extraction in Python 2.6

Using a regular expression because the HTML cannot be parsed.
totalwebcasting
Jaime Marquínez Ferrándiz 11 years ago
parent
commit
b03d0d064c
1 changed file with 3 additions and 2 deletions
  1. +3
    -2
      youtube_dl/extractor/imdb.py

+ 3
- 2
youtube_dl/extractor/imdb.py View File

@@ -38,8 +38,9 @@ class ImdbIE(InfoExtractor):
format_page = self._download_webpage( format_page = self._download_webpage(
compat_urlparse.urljoin(url, f_path), compat_urlparse.urljoin(url, f_path),
u'Downloading info for %s format' % f_id) u'Downloading info for %s format' % f_id)
json_data = get_element_by_attribute('class', 'imdb-player-data',
format_page)
json_data = self._search_regex(
r'<script[^>]+class="imdb-player-data"[^>]*?>(.*?)</script>',
format_page, u'json data', flags=re.DOTALL)
info = json.loads(json_data) info = json.loads(json_data)
format_info = info['videoPlayerObject']['video'] format_info = info['videoPlayerObject']['video']
formats.append({ formats.append({


Loading…
Cancel
Save