[test_YoutubeDL] Fix test_youtube_format_selection
[youtube-dl] / test / test_YoutubeDL.py
1 #!/usr/bin/env python
2
3 from __future__ import unicode_literals
4
5 # Allow direct execution
6 import os
7 import sys
8 import unittest
9 sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
10
11 import copy
12
13 from test.helper import FakeYDL, assertRegexpMatches
14 from youtube_dl import YoutubeDL
15 from youtube_dl.compat import compat_str, compat_urllib_error
16 from youtube_dl.extractor import YoutubeIE
17 from youtube_dl.extractor.common import InfoExtractor
18 from youtube_dl.postprocessor.common import PostProcessor
19 from youtube_dl.utils import ExtractorError, match_filter_func
20
21 TEST_URL = 'http://localhost/sample.mp4'
22
23
24 class YDL(FakeYDL):
25     def __init__(self, *args, **kwargs):
26         super(YDL, self).__init__(*args, **kwargs)
27         self.downloaded_info_dicts = []
28         self.msgs = []
29
30     def process_info(self, info_dict):
31         self.downloaded_info_dicts.append(info_dict)
32
33     def to_screen(self, msg):
34         self.msgs.append(msg)
35
36
37 def _make_result(formats, **kwargs):
38     res = {
39         'formats': formats,
40         'id': 'testid',
41         'title': 'testttitle',
42         'extractor': 'testex',
43     }
44     res.update(**kwargs)
45     return res
46
47
48 class TestFormatSelection(unittest.TestCase):
49     def test_prefer_free_formats(self):
50         # Same resolution => download webm
51         ydl = YDL()
52         ydl.params['prefer_free_formats'] = True
53         formats = [
54             {'ext': 'webm', 'height': 460, 'url': TEST_URL},
55             {'ext': 'mp4', 'height': 460, 'url': TEST_URL},
56         ]
57         info_dict = _make_result(formats)
58         yie = YoutubeIE(ydl)
59         yie._sort_formats(info_dict['formats'])
60         ydl.process_ie_result(info_dict)
61         downloaded = ydl.downloaded_info_dicts[0]
62         self.assertEqual(downloaded['ext'], 'webm')
63
64         # Different resolution => download best quality (mp4)
65         ydl = YDL()
66         ydl.params['prefer_free_formats'] = True
67         formats = [
68             {'ext': 'webm', 'height': 720, 'url': TEST_URL},
69             {'ext': 'mp4', 'height': 1080, 'url': TEST_URL},
70         ]
71         info_dict['formats'] = formats
72         yie = YoutubeIE(ydl)
73         yie._sort_formats(info_dict['formats'])
74         ydl.process_ie_result(info_dict)
75         downloaded = ydl.downloaded_info_dicts[0]
76         self.assertEqual(downloaded['ext'], 'mp4')
77
78         # No prefer_free_formats => prefer mp4 and flv for greater compatibility
79         ydl = YDL()
80         ydl.params['prefer_free_formats'] = False
81         formats = [
82             {'ext': 'webm', 'height': 720, 'url': TEST_URL},
83             {'ext': 'mp4', 'height': 720, 'url': TEST_URL},
84             {'ext': 'flv', 'height': 720, 'url': TEST_URL},
85         ]
86         info_dict['formats'] = formats
87         yie = YoutubeIE(ydl)
88         yie._sort_formats(info_dict['formats'])
89         ydl.process_ie_result(info_dict)
90         downloaded = ydl.downloaded_info_dicts[0]
91         self.assertEqual(downloaded['ext'], 'mp4')
92
93         ydl = YDL()
94         ydl.params['prefer_free_formats'] = False
95         formats = [
96             {'ext': 'flv', 'height': 720, 'url': TEST_URL},
97             {'ext': 'webm', 'height': 720, 'url': TEST_URL},
98         ]
99         info_dict['formats'] = formats
100         yie = YoutubeIE(ydl)
101         yie._sort_formats(info_dict['formats'])
102         ydl.process_ie_result(info_dict)
103         downloaded = ydl.downloaded_info_dicts[0]
104         self.assertEqual(downloaded['ext'], 'flv')
105
106     def test_format_selection(self):
107         formats = [
108             {'format_id': '35', 'ext': 'mp4', 'preference': 1, 'url': TEST_URL},
109             {'format_id': 'example-with-dashes', 'ext': 'webm', 'preference': 1, 'url': TEST_URL},
110             {'format_id': '45', 'ext': 'webm', 'preference': 2, 'url': TEST_URL},
111             {'format_id': '47', 'ext': 'webm', 'preference': 3, 'url': TEST_URL},
112             {'format_id': '2', 'ext': 'flv', 'preference': 4, 'url': TEST_URL},
113         ]
114         info_dict = _make_result(formats)
115
116         ydl = YDL({'format': '20/47'})
117         ydl.process_ie_result(info_dict.copy())
118         downloaded = ydl.downloaded_info_dicts[0]
119         self.assertEqual(downloaded['format_id'], '47')
120
121         ydl = YDL({'format': '20/71/worst'})
122         ydl.process_ie_result(info_dict.copy())
123         downloaded = ydl.downloaded_info_dicts[0]
124         self.assertEqual(downloaded['format_id'], '35')
125
126         ydl = YDL()
127         ydl.process_ie_result(info_dict.copy())
128         downloaded = ydl.downloaded_info_dicts[0]
129         self.assertEqual(downloaded['format_id'], '2')
130
131         ydl = YDL({'format': 'webm/mp4'})
132         ydl.process_ie_result(info_dict.copy())
133         downloaded = ydl.downloaded_info_dicts[0]
134         self.assertEqual(downloaded['format_id'], '47')
135
136         ydl = YDL({'format': '3gp/40/mp4'})
137         ydl.process_ie_result(info_dict.copy())
138         downloaded = ydl.downloaded_info_dicts[0]
139         self.assertEqual(downloaded['format_id'], '35')
140
141         ydl = YDL({'format': 'example-with-dashes'})
142         ydl.process_ie_result(info_dict.copy())
143         downloaded = ydl.downloaded_info_dicts[0]
144         self.assertEqual(downloaded['format_id'], 'example-with-dashes')
145
146     def test_format_selection_audio(self):
147         formats = [
148             {'format_id': 'audio-low', 'ext': 'webm', 'preference': 1, 'vcodec': 'none', 'url': TEST_URL},
149             {'format_id': 'audio-mid', 'ext': 'webm', 'preference': 2, 'vcodec': 'none', 'url': TEST_URL},
150             {'format_id': 'audio-high', 'ext': 'flv', 'preference': 3, 'vcodec': 'none', 'url': TEST_URL},
151             {'format_id': 'vid', 'ext': 'mp4', 'preference': 4, 'url': TEST_URL},
152         ]
153         info_dict = _make_result(formats)
154
155         ydl = YDL({'format': 'bestaudio'})
156         ydl.process_ie_result(info_dict.copy())
157         downloaded = ydl.downloaded_info_dicts[0]
158         self.assertEqual(downloaded['format_id'], 'audio-high')
159
160         ydl = YDL({'format': 'worstaudio'})
161         ydl.process_ie_result(info_dict.copy())
162         downloaded = ydl.downloaded_info_dicts[0]
163         self.assertEqual(downloaded['format_id'], 'audio-low')
164
165         formats = [
166             {'format_id': 'vid-low', 'ext': 'mp4', 'preference': 1, 'url': TEST_URL},
167             {'format_id': 'vid-high', 'ext': 'mp4', 'preference': 2, 'url': TEST_URL},
168         ]
169         info_dict = _make_result(formats)
170
171         ydl = YDL({'format': 'bestaudio/worstaudio/best'})
172         ydl.process_ie_result(info_dict.copy())
173         downloaded = ydl.downloaded_info_dicts[0]
174         self.assertEqual(downloaded['format_id'], 'vid-high')
175
176     def test_format_selection_audio_exts(self):
177         formats = [
178             {'format_id': 'mp3-64', 'ext': 'mp3', 'abr': 64, 'url': 'http://_', 'vcodec': 'none'},
179             {'format_id': 'ogg-64', 'ext': 'ogg', 'abr': 64, 'url': 'http://_', 'vcodec': 'none'},
180             {'format_id': 'aac-64', 'ext': 'aac', 'abr': 64, 'url': 'http://_', 'vcodec': 'none'},
181             {'format_id': 'mp3-32', 'ext': 'mp3', 'abr': 32, 'url': 'http://_', 'vcodec': 'none'},
182             {'format_id': 'aac-32', 'ext': 'aac', 'abr': 32, 'url': 'http://_', 'vcodec': 'none'},
183         ]
184
185         info_dict = _make_result(formats)
186         ydl = YDL({'format': 'best'})
187         ie = YoutubeIE(ydl)
188         ie._sort_formats(info_dict['formats'])
189         ydl.process_ie_result(copy.deepcopy(info_dict))
190         downloaded = ydl.downloaded_info_dicts[0]
191         self.assertEqual(downloaded['format_id'], 'aac-64')
192
193         ydl = YDL({'format': 'mp3'})
194         ie = YoutubeIE(ydl)
195         ie._sort_formats(info_dict['formats'])
196         ydl.process_ie_result(copy.deepcopy(info_dict))
197         downloaded = ydl.downloaded_info_dicts[0]
198         self.assertEqual(downloaded['format_id'], 'mp3-64')
199
200         ydl = YDL({'prefer_free_formats': True})
201         ie = YoutubeIE(ydl)
202         ie._sort_formats(info_dict['formats'])
203         ydl.process_ie_result(copy.deepcopy(info_dict))
204         downloaded = ydl.downloaded_info_dicts[0]
205         self.assertEqual(downloaded['format_id'], 'ogg-64')
206
207     def test_format_selection_video(self):
208         formats = [
209             {'format_id': 'dash-video-low', 'ext': 'mp4', 'preference': 1, 'acodec': 'none', 'url': TEST_URL},
210             {'format_id': 'dash-video-high', 'ext': 'mp4', 'preference': 2, 'acodec': 'none', 'url': TEST_URL},
211             {'format_id': 'vid', 'ext': 'mp4', 'preference': 3, 'url': TEST_URL},
212         ]
213         info_dict = _make_result(formats)
214
215         ydl = YDL({'format': 'bestvideo'})
216         ydl.process_ie_result(info_dict.copy())
217         downloaded = ydl.downloaded_info_dicts[0]
218         self.assertEqual(downloaded['format_id'], 'dash-video-high')
219
220         ydl = YDL({'format': 'worstvideo'})
221         ydl.process_ie_result(info_dict.copy())
222         downloaded = ydl.downloaded_info_dicts[0]
223         self.assertEqual(downloaded['format_id'], 'dash-video-low')
224
225         formats = [
226             {'format_id': 'vid-vcodec-dot', 'ext': 'mp4', 'preference': 1, 'vcodec': 'avc1.123456', 'acodec': 'none', 'url': TEST_URL},
227         ]
228         info_dict = _make_result(formats)
229
230         ydl = YDL({'format': 'bestvideo[vcodec=avc1.123456]'})
231         ydl.process_ie_result(info_dict.copy())
232         downloaded = ydl.downloaded_info_dicts[0]
233         self.assertEqual(downloaded['format_id'], 'vid-vcodec-dot')
234
235     def test_youtube_format_selection(self):
236         order = [
237             '38', '37', '46', '22', '45', '35', '44', '18', '34', '43', '6', '5', '36', '17', '13',
238             # Apple HTTP Live Streaming
239             '96', '95', '94', '93', '92', '132', '151',
240             # 3D
241             '85', '84', '102', '83', '101', '82', '100',
242             # Dash video
243             '137', '248', '136', '247', '135', '246',
244             '245', '244', '134', '243', '133', '242', '160',
245             # Dash audio
246             '141', '172', '140', '171', '139',
247         ]
248
249         def format_info(f_id):
250             info = YoutubeIE._formats[f_id].copy()
251
252             # XXX: In real cases InfoExtractor._parse_mpd() fills up 'acodec'
253             # and 'vcodec', while in tests such information is incomplete since
254             # commit a6c2c24479e5f4827ceb06f64d855329c0a6f593
255             # test_YoutubeDL.test_youtube_format_selection is broken without
256             # this fix
257             if 'acodec' in info and 'vcodec' not in info:
258                 info['vcodec'] = 'none'
259             elif 'vcodec' in info and 'acodec' not in info:
260                 info['acodec'] = 'none'
261
262             info['format_id'] = f_id
263             info['url'] = 'url:' + f_id
264             return info
265         formats_order = [format_info(f_id) for f_id in order]
266
267         info_dict = _make_result(list(formats_order), extractor='youtube')
268         ydl = YDL({'format': 'bestvideo+bestaudio'})
269         yie = YoutubeIE(ydl)
270         yie._sort_formats(info_dict['formats'])
271         ydl.process_ie_result(info_dict)
272         downloaded = ydl.downloaded_info_dicts[0]
273         self.assertEqual(downloaded['format_id'], '137+141')
274         self.assertEqual(downloaded['ext'], 'mp4')
275
276         info_dict = _make_result(list(formats_order), extractor='youtube')
277         ydl = YDL({'format': 'bestvideo[height>=999999]+bestaudio/best'})
278         yie = YoutubeIE(ydl)
279         yie._sort_formats(info_dict['formats'])
280         ydl.process_ie_result(info_dict)
281         downloaded = ydl.downloaded_info_dicts[0]
282         self.assertEqual(downloaded['format_id'], '38')
283
284         info_dict = _make_result(list(formats_order), extractor='youtube')
285         ydl = YDL({'format': 'bestvideo/best,bestaudio'})
286         yie = YoutubeIE(ydl)
287         yie._sort_formats(info_dict['formats'])
288         ydl.process_ie_result(info_dict)
289         downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts]
290         self.assertEqual(downloaded_ids, ['137', '141'])
291
292         info_dict = _make_result(list(formats_order), extractor='youtube')
293         ydl = YDL({'format': '(bestvideo[ext=mp4],bestvideo[ext=webm])+bestaudio'})
294         yie = YoutubeIE(ydl)
295         yie._sort_formats(info_dict['formats'])
296         ydl.process_ie_result(info_dict)
297         downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts]
298         self.assertEqual(downloaded_ids, ['137+141', '248+141'])
299
300         info_dict = _make_result(list(formats_order), extractor='youtube')
301         ydl = YDL({'format': '(bestvideo[ext=mp4],bestvideo[ext=webm])[height<=720]+bestaudio'})
302         yie = YoutubeIE(ydl)
303         yie._sort_formats(info_dict['formats'])
304         ydl.process_ie_result(info_dict)
305         downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts]
306         self.assertEqual(downloaded_ids, ['136+141', '247+141'])
307
308         info_dict = _make_result(list(formats_order), extractor='youtube')
309         ydl = YDL({'format': '(bestvideo[ext=none]/bestvideo[ext=webm])+bestaudio'})
310         yie = YoutubeIE(ydl)
311         yie._sort_formats(info_dict['formats'])
312         ydl.process_ie_result(info_dict)
313         downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts]
314         self.assertEqual(downloaded_ids, ['248+141'])
315
316         for f1, f2 in zip(formats_order, formats_order[1:]):
317             info_dict = _make_result([f1, f2], extractor='youtube')
318             ydl = YDL({'format': 'best/bestvideo'})
319             yie = YoutubeIE(ydl)
320             yie._sort_formats(info_dict['formats'])
321             ydl.process_ie_result(info_dict)
322             downloaded = ydl.downloaded_info_dicts[0]
323             self.assertEqual(downloaded['format_id'], f1['format_id'])
324
325             info_dict = _make_result([f2, f1], extractor='youtube')
326             ydl = YDL({'format': 'best/bestvideo'})
327             yie = YoutubeIE(ydl)
328             yie._sort_formats(info_dict['formats'])
329             ydl.process_ie_result(info_dict)
330             downloaded = ydl.downloaded_info_dicts[0]
331             self.assertEqual(downloaded['format_id'], f1['format_id'])
332
333     def test_invalid_format_specs(self):
334         def assert_syntax_error(format_spec):
335             ydl = YDL({'format': format_spec})
336             info_dict = _make_result([{'format_id': 'foo', 'url': TEST_URL}])
337             self.assertRaises(SyntaxError, ydl.process_ie_result, info_dict)
338
339         assert_syntax_error('bestvideo,,best')
340         assert_syntax_error('+bestaudio')
341         assert_syntax_error('bestvideo+')
342         assert_syntax_error('/')
343
344     def test_format_filtering(self):
345         formats = [
346             {'format_id': 'A', 'filesize': 500, 'width': 1000},
347             {'format_id': 'B', 'filesize': 1000, 'width': 500},
348             {'format_id': 'C', 'filesize': 1000, 'width': 400},
349             {'format_id': 'D', 'filesize': 2000, 'width': 600},
350             {'format_id': 'E', 'filesize': 3000},
351             {'format_id': 'F'},
352             {'format_id': 'G', 'filesize': 1000000},
353         ]
354         for f in formats:
355             f['url'] = 'http://_/'
356             f['ext'] = 'unknown'
357         info_dict = _make_result(formats)
358
359         ydl = YDL({'format': 'best[filesize<3000]'})
360         ydl.process_ie_result(info_dict)
361         downloaded = ydl.downloaded_info_dicts[0]
362         self.assertEqual(downloaded['format_id'], 'D')
363
364         ydl = YDL({'format': 'best[filesize<=3000]'})
365         ydl.process_ie_result(info_dict)
366         downloaded = ydl.downloaded_info_dicts[0]
367         self.assertEqual(downloaded['format_id'], 'E')
368
369         ydl = YDL({'format': 'best[filesize <= ? 3000]'})
370         ydl.process_ie_result(info_dict)
371         downloaded = ydl.downloaded_info_dicts[0]
372         self.assertEqual(downloaded['format_id'], 'F')
373
374         ydl = YDL({'format': 'best [filesize = 1000] [width>450]'})
375         ydl.process_ie_result(info_dict)
376         downloaded = ydl.downloaded_info_dicts[0]
377         self.assertEqual(downloaded['format_id'], 'B')
378
379         ydl = YDL({'format': 'best [filesize = 1000] [width!=450]'})
380         ydl.process_ie_result(info_dict)
381         downloaded = ydl.downloaded_info_dicts[0]
382         self.assertEqual(downloaded['format_id'], 'C')
383
384         ydl = YDL({'format': '[filesize>?1]'})
385         ydl.process_ie_result(info_dict)
386         downloaded = ydl.downloaded_info_dicts[0]
387         self.assertEqual(downloaded['format_id'], 'G')
388
389         ydl = YDL({'format': '[filesize<1M]'})
390         ydl.process_ie_result(info_dict)
391         downloaded = ydl.downloaded_info_dicts[0]
392         self.assertEqual(downloaded['format_id'], 'E')
393
394         ydl = YDL({'format': '[filesize<1MiB]'})
395         ydl.process_ie_result(info_dict)
396         downloaded = ydl.downloaded_info_dicts[0]
397         self.assertEqual(downloaded['format_id'], 'G')
398
399         ydl = YDL({'format': 'all[width>=400][width<=600]'})
400         ydl.process_ie_result(info_dict)
401         downloaded_ids = [info['format_id'] for info in ydl.downloaded_info_dicts]
402         self.assertEqual(downloaded_ids, ['B', 'C', 'D'])
403
404         ydl = YDL({'format': 'best[height<40]'})
405         try:
406             ydl.process_ie_result(info_dict)
407         except ExtractorError:
408             pass
409         self.assertEqual(ydl.downloaded_info_dicts, [])
410
411
412 class TestYoutubeDL(unittest.TestCase):
413     def test_subtitles(self):
414         def s_formats(lang, autocaption=False):
415             return [{
416                 'ext': ext,
417                 'url': 'http://localhost/video.%s.%s' % (lang, ext),
418                 '_auto': autocaption,
419             } for ext in ['vtt', 'srt', 'ass']]
420         subtitles = dict((l, s_formats(l)) for l in ['en', 'fr', 'es'])
421         auto_captions = dict((l, s_formats(l, True)) for l in ['it', 'pt', 'es'])
422         info_dict = {
423             'id': 'test',
424             'title': 'Test',
425             'url': 'http://localhost/video.mp4',
426             'subtitles': subtitles,
427             'automatic_captions': auto_captions,
428             'extractor': 'TEST',
429         }
430
431         def get_info(params={}):
432             params.setdefault('simulate', True)
433             ydl = YDL(params)
434             ydl.report_warning = lambda *args, **kargs: None
435             return ydl.process_video_result(info_dict, download=False)
436
437         result = get_info()
438         self.assertFalse(result.get('requested_subtitles'))
439         self.assertEqual(result['subtitles'], subtitles)
440         self.assertEqual(result['automatic_captions'], auto_captions)
441
442         result = get_info({'writesubtitles': True})
443         subs = result['requested_subtitles']
444         self.assertTrue(subs)
445         self.assertEqual(set(subs.keys()), set(['en']))
446         self.assertTrue(subs['en'].get('data') is None)
447         self.assertEqual(subs['en']['ext'], 'ass')
448
449         result = get_info({'writesubtitles': True, 'subtitlesformat': 'foo/srt'})
450         subs = result['requested_subtitles']
451         self.assertEqual(subs['en']['ext'], 'srt')
452
453         result = get_info({'writesubtitles': True, 'subtitleslangs': ['es', 'fr', 'it']})
454         subs = result['requested_subtitles']
455         self.assertTrue(subs)
456         self.assertEqual(set(subs.keys()), set(['es', 'fr']))
457
458         result = get_info({'writesubtitles': True, 'writeautomaticsub': True, 'subtitleslangs': ['es', 'pt']})
459         subs = result['requested_subtitles']
460         self.assertTrue(subs)
461         self.assertEqual(set(subs.keys()), set(['es', 'pt']))
462         self.assertFalse(subs['es']['_auto'])
463         self.assertTrue(subs['pt']['_auto'])
464
465         result = get_info({'writeautomaticsub': True, 'subtitleslangs': ['es', 'pt']})
466         subs = result['requested_subtitles']
467         self.assertTrue(subs)
468         self.assertEqual(set(subs.keys()), set(['es', 'pt']))
469         self.assertTrue(subs['es']['_auto'])
470         self.assertTrue(subs['pt']['_auto'])
471
472     def test_add_extra_info(self):
473         test_dict = {
474             'extractor': 'Foo',
475         }
476         extra_info = {
477             'extractor': 'Bar',
478             'playlist': 'funny videos',
479         }
480         YDL.add_extra_info(test_dict, extra_info)
481         self.assertEqual(test_dict['extractor'], 'Foo')
482         self.assertEqual(test_dict['playlist'], 'funny videos')
483
484     def test_prepare_filename(self):
485         info = {
486             'id': '1234',
487             'ext': 'mp4',
488             'width': None,
489         }
490
491         def fname(templ):
492             ydl = YoutubeDL({'outtmpl': templ})
493             return ydl.prepare_filename(info)
494         self.assertEqual(fname('%(id)s.%(ext)s'), '1234.mp4')
495         self.assertEqual(fname('%(id)s-%(width)s.%(ext)s'), '1234-NA.mp4')
496         # Replace missing fields with 'NA'
497         self.assertEqual(fname('%(uploader_date)s-%(id)s.%(ext)s'), 'NA-1234.mp4')
498
499     def test_format_note(self):
500         ydl = YoutubeDL()
501         self.assertEqual(ydl._format_note({}), '')
502         assertRegexpMatches(self, ydl._format_note({
503             'vbr': 10,
504         }), '^\s*10k$')
505
506     def test_postprocessors(self):
507         filename = 'post-processor-testfile.mp4'
508         audiofile = filename + '.mp3'
509
510         class SimplePP(PostProcessor):
511             def run(self, info):
512                 with open(audiofile, 'wt') as f:
513                     f.write('EXAMPLE')
514                 return [info['filepath']], info
515
516         def run_pp(params, PP):
517             with open(filename, 'wt') as f:
518                 f.write('EXAMPLE')
519             ydl = YoutubeDL(params)
520             ydl.add_post_processor(PP())
521             ydl.post_process(filename, {'filepath': filename})
522
523         run_pp({'keepvideo': True}, SimplePP)
524         self.assertTrue(os.path.exists(filename), '%s doesn\'t exist' % filename)
525         self.assertTrue(os.path.exists(audiofile), '%s doesn\'t exist' % audiofile)
526         os.unlink(filename)
527         os.unlink(audiofile)
528
529         run_pp({'keepvideo': False}, SimplePP)
530         self.assertFalse(os.path.exists(filename), '%s exists' % filename)
531         self.assertTrue(os.path.exists(audiofile), '%s doesn\'t exist' % audiofile)
532         os.unlink(audiofile)
533
534         class ModifierPP(PostProcessor):
535             def run(self, info):
536                 with open(info['filepath'], 'wt') as f:
537                     f.write('MODIFIED')
538                 return [], info
539
540         run_pp({'keepvideo': False}, ModifierPP)
541         self.assertTrue(os.path.exists(filename), '%s doesn\'t exist' % filename)
542         os.unlink(filename)
543
544     def test_match_filter(self):
545         class FilterYDL(YDL):
546             def __init__(self, *args, **kwargs):
547                 super(FilterYDL, self).__init__(*args, **kwargs)
548                 self.params['simulate'] = True
549
550             def process_info(self, info_dict):
551                 super(YDL, self).process_info(info_dict)
552
553             def _match_entry(self, info_dict, incomplete):
554                 res = super(FilterYDL, self)._match_entry(info_dict, incomplete)
555                 if res is None:
556                     self.downloaded_info_dicts.append(info_dict)
557                 return res
558
559         first = {
560             'id': '1',
561             'url': TEST_URL,
562             'title': 'one',
563             'extractor': 'TEST',
564             'duration': 30,
565             'filesize': 10 * 1024,
566         }
567         second = {
568             'id': '2',
569             'url': TEST_URL,
570             'title': 'two',
571             'extractor': 'TEST',
572             'duration': 10,
573             'description': 'foo',
574             'filesize': 5 * 1024,
575         }
576         videos = [first, second]
577
578         def get_videos(filter_=None):
579             ydl = FilterYDL({'match_filter': filter_})
580             for v in videos:
581                 ydl.process_ie_result(v, download=True)
582             return [v['id'] for v in ydl.downloaded_info_dicts]
583
584         res = get_videos()
585         self.assertEqual(res, ['1', '2'])
586
587         def f(v):
588             if v['id'] == '1':
589                 return None
590             else:
591                 return 'Video id is not 1'
592         res = get_videos(f)
593         self.assertEqual(res, ['1'])
594
595         f = match_filter_func('duration < 30')
596         res = get_videos(f)
597         self.assertEqual(res, ['2'])
598
599         f = match_filter_func('description = foo')
600         res = get_videos(f)
601         self.assertEqual(res, ['2'])
602
603         f = match_filter_func('description =? foo')
604         res = get_videos(f)
605         self.assertEqual(res, ['1', '2'])
606
607         f = match_filter_func('filesize > 5KiB')
608         res = get_videos(f)
609         self.assertEqual(res, ['1'])
610
611     def test_playlist_items_selection(self):
612         entries = [{
613             'id': compat_str(i),
614             'title': compat_str(i),
615             'url': TEST_URL,
616         } for i in range(1, 5)]
617         playlist = {
618             '_type': 'playlist',
619             'id': 'test',
620             'entries': entries,
621             'extractor': 'test:playlist',
622             'extractor_key': 'test:playlist',
623             'webpage_url': 'http://example.com',
624         }
625
626         def get_ids(params):
627             ydl = YDL(params)
628             # make a copy because the dictionary can be modified
629             ydl.process_ie_result(playlist.copy())
630             return [int(v['id']) for v in ydl.downloaded_info_dicts]
631
632         result = get_ids({})
633         self.assertEqual(result, [1, 2, 3, 4])
634
635         result = get_ids({'playlistend': 10})
636         self.assertEqual(result, [1, 2, 3, 4])
637
638         result = get_ids({'playlistend': 2})
639         self.assertEqual(result, [1, 2])
640
641         result = get_ids({'playliststart': 10})
642         self.assertEqual(result, [])
643
644         result = get_ids({'playliststart': 2})
645         self.assertEqual(result, [2, 3, 4])
646
647         result = get_ids({'playlist_items': '2-4'})
648         self.assertEqual(result, [2, 3, 4])
649
650         result = get_ids({'playlist_items': '2,4'})
651         self.assertEqual(result, [2, 4])
652
653         result = get_ids({'playlist_items': '10'})
654         self.assertEqual(result, [])
655
656     def test_urlopen_no_file_protocol(self):
657         # see https://github.com/rg3/youtube-dl/issues/8227
658         ydl = YDL()
659         self.assertRaises(compat_urllib_error.URLError, ydl.urlopen, 'file:///etc/passwd')
660
661     def test_do_not_override_ie_key_in_url_transparent(self):
662         ydl = YDL()
663
664         class Foo1IE(InfoExtractor):
665             _VALID_URL = r'foo1:'
666
667             def _real_extract(self, url):
668                 return {
669                     '_type': 'url_transparent',
670                     'url': 'foo2:',
671                     'ie_key': 'Foo2',
672                 }
673
674         class Foo2IE(InfoExtractor):
675             _VALID_URL = r'foo2:'
676
677             def _real_extract(self, url):
678                 return {
679                     '_type': 'url',
680                     'url': 'foo3:',
681                     'ie_key': 'Foo3',
682                 }
683
684         class Foo3IE(InfoExtractor):
685             _VALID_URL = r'foo3:'
686
687             def _real_extract(self, url):
688                 return _make_result([{'url': TEST_URL}])
689
690         ydl.add_info_extractor(Foo1IE(ydl))
691         ydl.add_info_extractor(Foo2IE(ydl))
692         ydl.add_info_extractor(Foo3IE(ydl))
693         ydl.extract_info('foo1:')
694         downloaded = ydl.downloaded_info_dicts[0]
695         self.assertEqual(downloaded['url'], TEST_URL)
696
697
698 if __name__ == '__main__':
699     unittest.main()