[test_all_urls] Simplify
[youtube-dl] / test / test_all_urls.py
1 #!/usr/bin/env python
2
3 from __future__ import unicode_literals
4
5 # Allow direct execution
6 import os
7 import sys
8 import unittest
9 sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
10
11
12 from test.helper import gettestcases
13
14 from youtube_dl.extractor import (
15     FacebookIE,
16     gen_extractors,
17     JustinTVIE,
18     PBSIE,
19     YoutubeIE,
20 )
21
22
class TestAllURLsMatching(unittest.TestCase):
    """Check which extractors declare themselves suitable for a given URL.

    Each test feeds URLs (or bare IDs / ``:keyword`` shortcuts) to the
    extractors' ``suitable()`` method and compares the set of extractors
    that accept the input against the expected one.
    """

    def setUp(self):
        # Build the extractor list anew for every test method.
        self.ies = gen_extractors()

    def matching_ies(self, url):
        """Return the ``IE_NAME`` of every non-generic extractor accepting *url*.

        The extractor named ``'generic'`` is always left out so that
        expectations only have to list the specific extractors.  The result
        keeps the order of ``self.ies``.
        """
        return [
            ie.IE_NAME for ie in self.ies
            if ie.suitable(url) and ie.IE_NAME != 'generic'
        ]

    def assertMatch(self, url, ie_list):
        """Assert that the non-generic extractors matching *url* equal *ie_list*.

        The comparison is an exact list equality, so both the members and
        their order must agree.
        """
        self.assertEqual(self.matching_ies(url), ie_list)

    def test_youtube_playlist_matching(self):
        def assertPlaylist(url):
            self.assertMatch(url, ['youtube:playlist'])

        assertPlaylist('ECUl4u3cNGP61MdtwGTqZA0MreSaDybji8')
        assertPlaylist('UUBABnxM4Ar9ten8Mdjj1j0Q')  # #585
        assertPlaylist('PL63F0C78739B09958')
        assertPlaylist('https://www.youtube.com/playlist?list=UUBABnxM4Ar9ten8Mdjj1j0Q')
        assertPlaylist('https://www.youtube.com/course?list=ECUl4u3cNGP61MdtwGTqZA0MreSaDybji8')
        assertPlaylist('https://www.youtube.com/playlist?list=PLwP_SiAcdui0KVebT0mU9Apz359a4ubsC')
        assertPlaylist('https://www.youtube.com/watch?v=AV6J6_AeFEQ&playnext=1&list=PL4023E734DA416012')  # #668
        # An 11-character ID starting with "PL" must not be taken for a playlist.
        self.assertFalse('youtube:playlist' in self.matching_ies('PLtS2H6bU1M'))
        # Top tracks
        assertPlaylist('https://www.youtube.com/playlist?list=MCUS.20142101')

    def test_youtube_matching(self):
        self.assertTrue(YoutubeIE.suitable('PLtS2H6bU1M'))
        self.assertFalse(YoutubeIE.suitable('https://www.youtube.com/watch?v=AV6J6_AeFEQ&playnext=1&list=PL4023E734DA416012'))  # #668
        self.assertMatch('http://youtu.be/BaW_jenozKc', ['youtube'])
        self.assertMatch('http://www.youtube.com/v/BaW_jenozKc', ['youtube'])
        self.assertMatch('https://youtube.googleapis.com/v/BaW_jenozKc', ['youtube'])
        self.assertMatch('http://www.cleanvideosearch.com/media/action/yt/watch?videoId=8v_4O44sfjM', ['youtube'])

    def test_youtube_channel_matching(self):
        def assertChannel(url):
            self.assertMatch(url, ['youtube:channel'])

        assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM')
        assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM?feature=gb_ch_rec')
        assertChannel('https://www.youtube.com/channel/HCtnHdj3df7iM/videos')

    def test_youtube_user_matching(self):
        self.assertMatch('www.youtube.com/NASAgovVideo/videos', ['youtube:user'])

    def test_youtube_feeds(self):
        self.assertMatch('https://www.youtube.com/feed/watch_later', ['youtube:watch_later'])
        self.assertMatch('https://www.youtube.com/feed/subscriptions', ['youtube:subscriptions'])
        self.assertMatch('https://www.youtube.com/feed/recommended', ['youtube:recommended'])
        self.assertMatch('https://www.youtube.com/my_favorites', ['youtube:favorites'])

    def test_youtube_show_matching(self):
        self.assertMatch('http://www.youtube.com/show/airdisasters', ['youtube:show'])

    def test_youtube_truncated(self):
        self.assertMatch('http://www.youtube.com/watch?', ['youtube:truncated_url'])

    def test_youtube_search_matching(self):
        self.assertMatch('http://www.youtube.com/results?search_query=making+mustard', ['youtube:search_url'])
        self.assertMatch('https://www.youtube.com/results?baz=bar&search_query=youtube-dl+test+video&filters=video&lclk=video', ['youtube:search_url'])

    def test_justin_tv_channelid_matching(self):
        self.assertTrue(JustinTVIE.suitable('justin.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('twitch.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('www.justin.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('www.twitch.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('http://www.justin.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv'))
        self.assertTrue(JustinTVIE.suitable('http://www.justin.tv/vanillatv/'))
        self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv/'))

    def test_justintv_videoid_matching(self):
        self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/vanillatv/b/328087483'))

    def test_justin_tv_chapterid_matching(self):
        self.assertTrue(JustinTVIE.suitable('http://www.twitch.tv/tsm_theoddone/c/2349361'))

    def test_youtube_extract(self):
        def assertExtractId(url, video_id):
            self.assertEqual(YoutubeIE.extract_id(url), video_id)

        assertExtractId('http://www.youtube.com/watch?&v=BaW_jenozKc', 'BaW_jenozKc')
        assertExtractId('https://www.youtube.com/watch?&v=BaW_jenozKc', 'BaW_jenozKc')
        assertExtractId('https://www.youtube.com/watch?feature=player_embedded&v=BaW_jenozKc', 'BaW_jenozKc')
        assertExtractId('https://www.youtube.com/watch_popup?v=BaW_jenozKc', 'BaW_jenozKc')
        assertExtractId('http://www.youtube.com/watch?v=BaW_jenozKcsharePLED17F32AD9753930', 'BaW_jenozKc')
        assertExtractId('BaW_jenozKc', 'BaW_jenozKc')

    def test_facebook_matching(self):
        self.assertTrue(FacebookIE.suitable('https://www.facebook.com/Shiniknoh#!/photo.php?v=10153317450565268'))

    def test_no_duplicates(self):
        """Each test-case URL must be accepted only by its own extractor.

        For every test case, the extractor class named ``<name>IE`` and
        ``GenericIE`` are required to accept the URL; every other extractor
        is required to reject it.
        """
        for tc in gettestcases():
            url = tc['url']
            expected_classes = ('GenericIE', tc['name'] + 'IE')
            for ie in self.ies:
                ie_class = type(ie).__name__
                if ie_class in expected_classes:
                    self.assertTrue(ie.suitable(url), '%s should match URL %r' % (ie_class, url))
                else:
                    self.assertFalse(ie.suitable(url), '%s should not match URL %r' % (ie_class, url))

    def test_keywords(self):
        self.assertMatch(':ytsubs', ['youtube:subscriptions'])
        self.assertMatch(':ytsubscriptions', ['youtube:subscriptions'])
        self.assertMatch(':ythistory', ['youtube:history'])
        self.assertMatch(':thedailyshow', ['ComedyCentralShows'])
        self.assertMatch(':tds', ['ComedyCentralShows'])
        self.assertMatch(':colbertreport', ['ComedyCentralShows'])
        self.assertMatch(':cr', ['ComedyCentralShows'])

    def test_vimeo_matching(self):
        self.assertMatch('http://vimeo.com/channels/tributes', ['vimeo:channel'])
        self.assertMatch('http://vimeo.com/channels/31259', ['vimeo:channel'])
        self.assertMatch('http://vimeo.com/channels/31259/53576664', ['vimeo'])
        self.assertMatch('http://vimeo.com/user7108434', ['vimeo:user'])
        self.assertMatch('http://vimeo.com/user7108434/videos', ['vimeo:user'])
        self.assertMatch('https://vimeo.com/user21297594/review/75524534/3c257a1b5d', ['vimeo:review'])

    # https://github.com/rg3/youtube-dl/issues/1930
    def test_soundcloud_not_matching_sets(self):
        self.assertMatch('http://soundcloud.com/floex/sets/gone-ep', ['soundcloud:set'])

    def test_tumblr(self):
        self.assertMatch('http://tatianamaslanydaily.tumblr.com/post/54196191430/orphan-black-dvd-extra-behind-the-scenes', ['Tumblr'])
        self.assertMatch('http://tatianamaslanydaily.tumblr.com/post/54196191430', ['Tumblr'])

    def test_pbs(self):
        # https://github.com/rg3/youtube-dl/issues/2350
        self.assertMatch('http://video.pbs.org/viralplayer/2365173446/', ['PBS'])
        self.assertMatch('http://video.pbs.org/widget/partnerplayer/980042464/', ['PBS'])

    def test_ComedyCentralShows(self):
        self.assertMatch(
            'http://thedailyshow.cc.com/extended-interviews/xm3fnq/andrew-napolitano-extended-interview',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thecolbertreport.cc.com/videos/29w6fx/-realhumanpraise-for-fox-news',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thecolbertreport.cc.com/videos/gh6urb/neil-degrasse-tyson-pt--1?xrs=eml_col_031114',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thedailyshow.cc.com/guests/michael-lewis/3efna8/exclusive---michael-lewis-extended-interview-pt--3',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thedailyshow.cc.com/episodes/sy7yv0/april-8--2014---denis-leary',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thecolbertreport.cc.com/episodes/8ase07/april-8--2014---jane-goodall',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thedailyshow.cc.com/video-playlists/npde3s/the-daily-show-19088-highlights',
            ['ComedyCentralShows'])
        self.assertMatch(
            'http://thedailyshow.cc.com/special-editions/2l8fdb/special-edition---a-look-back-at-food',
            ['ComedyCentralShows'])

    def test_yahoo_https(self):
        # https://github.com/rg3/youtube-dl/issues/2701
        self.assertMatch(
            'https://screen.yahoo.com/smartwatches-latest-wearable-gadgets-163745379-cbs.html',
            ['Yahoo'])
178
# Run the test suite via unittest when this file is executed directly.
179 if __name__ == '__main__':
180     unittest.main()