You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

177 lines
8.8 KiB

  1. #!/usr/bin/env python
  2. from __future__ import unicode_literals
  3. # Allow direct execution
  4. import os
  5. import sys
  6. import unittest
  7. sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
  8. from test.helper import gettestcases
  9. from youtube_dl.extractor import (
  10. FacebookIE,
  11. gen_extractors,
  12. JustinTVIE,
  13. YoutubeIE,
  14. )
  15. class TestAllURLsMatching(unittest.TestCase):
  16. def setUp(self):
  17. self.ies = gen_extractors()
  18. def matching_ies(self, url):
  19. return [ie.IE_NAME for ie in self.ies if ie.suitable(url) and ie.IE_NAME != 'generic']
  20. def assertMatch(self, url, ie_list):
  21. self.assertEqual(self.matching_ies(url), ie_list)
  22. def test_youtube_playlist_matching(self):
  23. assertPlaylist = lambda url: self.assertMatch(url, ['youtube:playlist'])
  24. assertPlaylist('ECUl4u3cNGP61MdtwGTqZA0MreSaDybji8')
  25. assertPlaylist('UUBABnxM4Ar9ten8Mdjj1j0Q') #585
  26. assertPlaylist('PL63F0C78739B09958')
  27. assertPlaylist('https://www.youtube.com/playlist?list=UUBABnxM4Ar9ten8Mdjj1j0Q')
  28. assertPlaylist('https://www.youtube.com/course?list=ECUl4u3cNGP61MdtwGTqZA0MreSaDybji8')
  29. assertPlaylist('https://www.youtube.com/playlist?list=PLwP_SiAcdui0KVebT0mU9Apz359a4ubsC')
  30. assertPlaylist('https://www.youtube.com/watch?v=AV6J6_AeFEQ&playnext=1&list=PL4023E734DA416012') #668
  31. self.assertFalse('youtube:playlist' in self.matching_ies('PLtS2H6bU1M'))
  32. # Top tracks
  33. assertPlaylist('https://www.youtube.com/playlist?list=MCUS.20142101')
  34. def test_youtube_matching(self):
  35. self.assertTrue(YoutubeIE.suitable('PLtS2H6bU1M'))
  36. self.assertFalse(YoutubeIE.suitable('https://www.youtube.com/watch?v=AV6J6_AeFEQ&playnext=1&list=PL4023E734DA416012')) #668
  37. self.assertMatch('http://youtu.be/BaW_jenozKc', ['youtube'])
  38. self.assertMatch('http://www.youtube.com/v/BaW_jenozKc', ['youtube'])
  39. self.assertMatch('https://youtube.googleapis.com/v/BaW_jenozKc', ['youtube'])
  40. self.assertMatch('http://www.cleanvideosearch.com/media/action/yt/watch?videoId=8v_4O44sfjM', ['youtube'])
  41. def test_youtube_channel_matching(self):
  42. assertChannel = lambda url: self.assertMatch(url, ['youtube:channel'])
  43. assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM')
  44. assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM?feature=gb_ch_rec')
  45. assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM/videos')
  46. def test_youtube_user_matching(self):
  47. self.assertMatch('www.youtube.com/NASAgovVideo/videos', ['youtube:user'])
  48. def test_youtube_feeds(self):
  49. self.assertMatch('https://www.youtube.com/feed/watch_later', ['youtube:watch_later'])
  50. self.assertMatch('https://www.youtube.com/feed/subscriptions', ['youtube:subscriptions'])
  51. self.assertMatch('https://www.youtube.com/feed/recommended', ['youtube:recommended'])
  52. self.assertMatch('https://www.youtube.com/my_favorites', ['youtube:favorites'])
  53. def test_youtube_show_matching(self):
  54. self.assertMatch('http://www.youtube.com/show/airdisasters', ['youtube:show'])
  55. def test_youtube_search_matching(self):
  56. self.assertMatch('http://www.youtube.com/results?search_query=making+mustard', ['youtube:search_url'])
  57. self.assertMatch('https://www.youtube.com/results?baz=bar&search_query=youtube-dl+test+video&filters=video&lclk=video', ['youtube:search_url'])
  58. def test_justin_tv_channelid_matching(self):
  59. self.assertTrue(JustinTVIE.suitable('justin.tv/vanillatv'))
  60. self.assertTrue(JustinTVIE.suitable('twitch.tv/vanillatv'))
  61. self.assertTrue(JustinTVIE.suitable('www.justin.tv/vanillatv'))
  62. self.assertTrue(JustinTVIE.suitable('www.twitch.tv/vanillatv'))
  63. self.assertTrue(JustinTVIE.suitable('http://www.justin.tv/vanillatv'))
  64. self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv'))
  65. self.assertTrue(JustinTVIE.suitable('http://www.justin.tv/vanillatv/'))
  66. self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv/'))
  67. def test_justintv_videoid_matching(self):
  68. self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv/b/328087483'))
  69. def test_justin_tv_chapterid_matching(self):
  70. self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/tsm_theoddone/c/2349361'))
  71. def test_youtube_extract(self):
  72. assertExtractId = lambda url, id: self.assertEqual(YoutubeIE.extract_id(url), id)
  73. assertExtractId('http://www.youtube.com/watch?&v=BaW_jenozKc', 'BaW_jenozKc')
  74. assertExtractId('https://www.youtube.com/watch?&v=BaW_jenozKc', 'BaW_jenozKc')
  75. assertExtractId('https://www.youtube.com/watch?feature=player_embedded&v=BaW_jenozKc', 'BaW_jenozKc')
  76. assertExtractId('https://www.youtube.com/watch_popup?v=BaW_jenozKc', 'BaW_jenozKc')
  77. assertExtractId('http://www.youtube.com/watch?v=BaW_jenozKcsharePLED17F32AD9753930', 'BaW_jenozKc')
  78. assertExtractId('BaW_jenozKc', 'BaW_jenozKc')
  79. def test_facebook_matching(self):
  80. self.assertTrue(FacebookIE.suitable('https://www.facebook.com/Shiniknoh#!/photo.php?v=10153317450565268'))
  81. def test_no_duplicates(self):
  82. ies = gen_extractors()
  83. for tc in gettestcases(include_onlymatching=True):
  84. url = tc['url']
  85. for ie in ies:
  86. if type(ie).__name__ in ('GenericIE', tc['name'] + 'IE'):
  87. self.assertTrue(ie.suitable(url), '%s should match URL %r' % (type(ie).__name__, url))
  88. else:
  89. self.assertFalse(ie.suitable(url), '%s should not match URL %r' % (type(ie).__name__, url))
  90. def test_keywords(self):
  91. self.assertMatch(':ytsubs', ['youtube:subscriptions'])
  92. self.assertMatch(':ytsubscriptions', ['youtube:subscriptions'])
  93. self.assertMatch(':ythistory', ['youtube:history'])
  94. self.assertMatch(':thedailyshow', ['ComedyCentralShows'])
  95. self.assertMatch(':tds', ['ComedyCentralShows'])
  96. self.assertMatch(':colbertreport', ['ComedyCentralShows'])
  97. self.assertMatch(':cr', ['ComedyCentralShows'])
  98. def test_vimeo_matching(self):
  99. self.assertMatch('http://vimeo.com/channels/tributes', ['vimeo:channel'])
  100. self.assertMatch('http://vimeo.com/channels/31259', ['vimeo:channel'])
  101. self.assertMatch('http://vimeo.com/channels/31259/53576664', ['vimeo'])
  102. self.assertMatch('http://vimeo.com/user7108434', ['vimeo:user'])
  103. self.assertMatch('http://vimeo.com/user7108434/videos', ['vimeo:user'])
  104. self.assertMatch('https://vimeo.com/user21297594/review/75524534/3c257a1b5d', ['vimeo:review'])
  105. # https://github.com/rg3/youtube-dl/issues/1930
  106. def test_soundcloud_not_matching_sets(self):
  107. self.assertMatch('http://soundcloud.com/floex/sets/gone-ep', ['soundcloud:set'])
  108. def test_tumblr(self):
  109. self.assertMatch('http://tatianamaslanydaily.tumblr.com/post/54196191430/orphan-black-dvd-extra-behind-the-scenes', ['Tumblr'])
  110. self.assertMatch('http://tatianamaslanydaily.tumblr.com/post/54196191430', ['Tumblr'])
  111. def test_pbs(self):
  112. # https://github.com/rg3/youtube-dl/issues/2350
  113. self.assertMatch('http://video.pbs.org/viralplayer/2365173446/', ['PBS'])
  114. self.assertMatch('http://video.pbs.org/widget/partnerplayer/980042464/', ['PBS'])
  115. def test_ComedyCentralShows(self):
  116. self.assertMatch(
  117. 'http://thedailyshow.cc.com/extended-interviews/xm3fnq/andrew-napolitano-extended-interview',
  118. ['ComedyCentralShows'])
  119. self.assertMatch(
  120. 'http://thecolbertreport.cc.com/videos/29w6fx/-realhumanpraise-for-fox-news',
  121. ['ComedyCentralShows'])
  122. self.assertMatch(
  123. 'http://thecolbertreport.cc.com/videos/gh6urb/neil-degrasse-tyson-pt--1?xrs=eml_col_031114',
  124. ['ComedyCentralShows'])
  125. self.assertMatch(
  126. 'http://thedailyshow.cc.com/guests/michael-lewis/3efna8/exclusive---michael-lewis-extended-interview-pt--3',
  127. ['ComedyCentralShows'])
  128. self.assertMatch(
  129. 'http://thedailyshow.cc.com/episodes/sy7yv0/april-8--2014---denis-leary',
  130. ['ComedyCentralShows'])
  131. self.assertMatch(
  132. 'http://thecolbertreport.cc.com/episodes/8ase07/april-8--2014---jane-goodall',
  133. ['ComedyCentralShows'])
  134. self.assertMatch(
  135. 'http://thedailyshow.cc.com/video-playlists/npde3s/the-daily-show-19088-highlights',
  136. ['ComedyCentralShows'])
  137. self.assertMatch(
  138. 'http://thedailyshow.cc.com/special-editions/2l8fdb/special-edition---a-look-back-at-food',
  139. ['ComedyCentralShows'])
  140. def test_yahoo_https(self):
  141. # https://github.com/rg3/youtube-dl/issues/2701
  142. self.assertMatch(
  143. 'https://screen.yahoo.com/smartwatches-latest-wearable-gadgets-163745379-cbs.html',
  144. ['Yahoo'])
  145. if __name__ == '__main__':
  146. unittest.main()