test_all_urls.py 6.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127
  1. #!/usr/bin/env python3
  2. from __future__ import unicode_literals
  3. # Allow direct execution
  4. import os
  5. import sys
  6. import unittest
  7. import collections
  8. sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
  9. from test.helper import gettestcases
  10. from yt_dlp.extractor import (
  11. FacebookIE,
  12. gen_extractors,
  13. YoutubeIE,
  14. )
  15. class TestAllURLsMatching(unittest.TestCase):
  16. def setUp(self):
  17. self.ies = gen_extractors()
  18. def matching_ies(self, url):
  19. return [ie.IE_NAME for ie in self.ies if ie.suitable(url) and ie.IE_NAME != 'generic']
  20. def assertMatch(self, url, ie_list):
  21. self.assertEqual(self.matching_ies(url), ie_list)
  22. def test_youtube_playlist_matching(self):
  23. assertPlaylist = lambda url: self.assertMatch(url, ['youtube:playlist'])
  24. assertTab = lambda url: self.assertMatch(url, ['youtube:tab'])
  25. assertPlaylist('ECUl4u3cNGP61MdtwGTqZA0MreSaDybji8')
  26. assertPlaylist('UUBABnxM4Ar9ten8Mdjj1j0Q') # 585
  27. assertPlaylist('PL63F0C78739B09958')
  28. assertTab('https://www.youtube.com/AsapSCIENCE')
  29. assertTab('https://www.youtube.com/embedded')
  30. assertTab('https://www.youtube.com/playlist?list=UUBABnxM4Ar9ten8Mdjj1j0Q')
  31. assertTab('https://www.youtube.com/playlist?list=PLwP_SiAcdui0KVebT0mU9Apz359a4ubsC')
  32. assertTab('https://www.youtube.com/watch?v=AV6J6_AeFEQ&playnext=1&list=PL4023E734DA416012') # 668
  33. self.assertFalse('youtube:playlist' in self.matching_ies('PLtS2H6bU1M'))
  34. # Top tracks
  35. assertTab('https://www.youtube.com/playlist?list=MCUS.20142101')
  36. def test_youtube_matching(self):
  37. self.assertTrue(YoutubeIE.suitable('PLtS2H6bU1M'))
  38. self.assertFalse(YoutubeIE.suitable('https://www.youtube.com/watch?v=AV6J6_AeFEQ&playnext=1&list=PL4023E734DA416012')) # 668
  39. self.assertMatch('http://youtu.be/BaW_jenozKc', ['youtube'])
  40. # self.assertMatch('http://www.youtube.com/v/BaW_jenozKc', ['youtube']) # /v/ is no longer valid
  41. self.assertMatch('https://youtube.googleapis.com/v/BaW_jenozKc', ['youtube'])
  42. self.assertMatch('http://www.cleanvideosearch.com/media/action/yt/watch?videoId=8v_4O44sfjM', ['youtube'])
  43. def test_youtube_channel_matching(self):
  44. assertChannel = lambda url: self.assertMatch(url, ['youtube:tab'])
  45. assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM')
  46. assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM?feature=gb_ch_rec')
  47. assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM/videos')
  48. def test_youtube_user_matching(self):
  49. self.assertMatch('http://www.youtube.com/NASAgovVideo/videos', ['youtube:tab'])
  50. def test_youtube_feeds(self):
  51. self.assertMatch('https://www.youtube.com/feed/library', ['youtube:tab'])
  52. self.assertMatch('https://www.youtube.com/feed/history', ['youtube:tab'])
  53. self.assertMatch('https://www.youtube.com/feed/watch_later', ['youtube:tab'])
  54. self.assertMatch('https://www.youtube.com/feed/subscriptions', ['youtube:tab'])
  55. def test_youtube_search_matching(self):
  56. self.assertMatch('http://www.youtube.com/results?search_query=making+mustard', ['youtube:search_url'])
  57. self.assertMatch('https://www.youtube.com/results?baz=bar&search_query=youtube-dl+test+video&filters=video&lclk=video', ['youtube:search_url'])
  58. def test_facebook_matching(self):
  59. self.assertTrue(FacebookIE.suitable('https://www.facebook.com/Shiniknoh#!/photo.php?v=10153317450565268'))
  60. self.assertTrue(FacebookIE.suitable('https://www.facebook.com/cindyweather?fref=ts#!/photo.php?v=10152183998945793'))
  61. def test_no_duplicates(self):
  62. ies = gen_extractors()
  63. for tc in gettestcases(include_onlymatching=True):
  64. url = tc['url']
  65. for ie in ies:
  66. if type(ie).__name__ in ('GenericIE', tc['name'] + 'IE'):
  67. self.assertTrue(ie.suitable(url), '%s should match URL %r' % (type(ie).__name__, url))
  68. else:
  69. self.assertFalse(
  70. ie.suitable(url),
  71. '%s should not match URL %r . That URL belongs to %s.' % (type(ie).__name__, url, tc['name']))
  72. def test_keywords(self):
  73. self.assertMatch(':ytsubs', ['youtube:subscriptions'])
  74. self.assertMatch(':ytsubscriptions', ['youtube:subscriptions'])
  75. self.assertMatch(':ythistory', ['youtube:history'])
  76. def test_vimeo_matching(self):
  77. self.assertMatch('https://vimeo.com/channels/tributes', ['vimeo:channel'])
  78. self.assertMatch('https://vimeo.com/channels/31259', ['vimeo:channel'])
  79. self.assertMatch('https://vimeo.com/channels/31259/53576664', ['vimeo'])
  80. self.assertMatch('https://vimeo.com/user7108434', ['vimeo:user'])
  81. self.assertMatch('https://vimeo.com/user7108434/videos', ['vimeo:user'])
  82. self.assertMatch('https://vimeo.com/user21297594/review/75524534/3c257a1b5d', ['vimeo:review'])
  83. # https://github.com/ytdl-org/youtube-dl/issues/1930
  84. def test_soundcloud_not_matching_sets(self):
  85. self.assertMatch('http://soundcloud.com/floex/sets/gone-ep', ['soundcloud:set'])
  86. def test_tumblr(self):
  87. self.assertMatch('http://tatianamaslanydaily.tumblr.com/post/54196191430/orphan-black-dvd-extra-behind-the-scenes', ['Tumblr'])
  88. self.assertMatch('http://tatianamaslanydaily.tumblr.com/post/54196191430', ['Tumblr'])
  89. def test_pbs(self):
  90. # https://github.com/ytdl-org/youtube-dl/issues/2350
  91. self.assertMatch('http://video.pbs.org/viralplayer/2365173446/', ['pbs'])
  92. self.assertMatch('http://video.pbs.org/widget/partnerplayer/980042464/', ['pbs'])
  93. def test_no_duplicated_ie_names(self):
  94. name_accu = collections.defaultdict(list)
  95. for ie in self.ies:
  96. name_accu[ie.IE_NAME.lower()].append(type(ie).__name__)
  97. for (ie_name, ie_list) in name_accu.items():
  98. self.assertEqual(
  99. len(ie_list), 1,
  100. 'Multiple extractors with the same IE_NAME "%s" (%s)' % (ie_name, ', '.join(ie_list)))
  101. if __name__ == '__main__':
  102. unittest.main()