You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

80 lines
2.8 KiB

  1. from __future__ import unicode_literals
  2. from .common import InfoExtractor
  3. from ..utils import remove_end
  4. class ESPNIE(InfoExtractor):
  5. _VALID_URL = r'https?://espn\.go\.com/(?:[^/]+/)*(?P<id>[^/]+)'
  6. _TESTS = [{
  7. 'url': 'http://espn.go.com/video/clip?id=10365079',
  8. 'md5': '60e5d097a523e767d06479335d1bdc58',
  9. 'info_dict': {
  10. 'id': 'FkYWtmazr6Ed8xmvILvKLWjd4QvYZpzG',
  11. 'ext': 'mp4',
  12. 'title': '30 for 30 Shorts: Judging Jewell',
  13. 'description': None,
  14. },
  15. 'params': {
  16. 'skip_download': True,
  17. },
  18. 'add_ie': ['OoyalaExternal'],
  19. }, {
  20. # intl video, from http://www.espnfc.us/video/mls-highlights/150/video/2743663/must-see-moments-best-of-the-mls-season
  21. 'url': 'http://espn.go.com/video/clip?id=2743663',
  22. 'md5': 'f4ac89b59afc7e2d7dbb049523df6768',
  23. 'info_dict': {
  24. 'id': '50NDFkeTqRHB0nXBOK-RGdSG5YQPuxHg',
  25. 'ext': 'mp4',
  26. 'title': 'Must-See Moments: Best of the MLS season',
  27. },
  28. 'params': {
  29. 'skip_download': True,
  30. },
  31. 'add_ie': ['OoyalaExternal'],
  32. }, {
  33. 'url': 'https://espn.go.com/video/iframe/twitter/?cms=espn&id=10365079',
  34. 'only_matching': True,
  35. }, {
  36. 'url': 'http://espn.go.com/nba/recap?gameId=400793786',
  37. 'only_matching': True,
  38. }, {
  39. 'url': 'http://espn.go.com/blog/golden-state-warriors/post/_/id/593/how-warriors-rapidly-regained-a-winning-edge',
  40. 'only_matching': True,
  41. }, {
  42. 'url': 'http://espn.go.com/sports/endurance/story/_/id/12893522/dzhokhar-tsarnaev-sentenced-role-boston-marathon-bombings',
  43. 'only_matching': True,
  44. }, {
  45. 'url': 'http://espn.go.com/nba/playoffs/2015/story/_/id/12887571/john-wall-washington-wizards-no-swelling-left-hand-wrist-game-5-return',
  46. 'only_matching': True,
  47. }]
  48. def _real_extract(self, url):
  49. video_id = self._match_id(url)
  50. webpage = self._download_webpage(url, video_id)
  51. video_id = self._search_regex(
  52. r'class=(["\']).*?video-play-button.*?\1[^>]+data-id=["\'](?P<id>\d+)',
  53. webpage, 'video id', group='id')
  54. cms = 'espn'
  55. if 'data-source="intl"' in webpage:
  56. cms = 'intl'
  57. player_url = 'https://espn.go.com/video/iframe/twitter/?id=%s&cms=%s' % (video_id, cms)
  58. player = self._download_webpage(
  59. player_url, video_id)
  60. pcode = self._search_regex(
  61. r'["\']pcode=([^"\']+)["\']', player, 'pcode')
  62. title = remove_end(
  63. self._og_search_title(webpage),
  64. '- ESPN Video').strip()
  65. return {
  66. '_type': 'url_transparent',
  67. 'url': 'ooyalaexternal:%s:%s:%s' % (cms, video_id, pcode),
  68. 'ie_key': 'OoyalaExternal',
  69. 'title': title,
  70. }