From: Benjamin Congdon Date: Fri, 11 Mar 2016 15:31:35 +0000 (-0600) Subject: [bbc] Fix BBC Extractor to work with 'School Report' X-Git-Url: http://git.bitcoin.ninja/?a=commitdiff_plain;h=8e4aa7bf18af4403bf98742270483f3b9cfbdeb6;p=youtube-dl [bbc] Fix BBC Extractor to work with 'School Report' --- diff --git a/youtube_dl/extractor/bbc.py b/youtube_dl/extractor/bbc.py index 9d0dfb961..f4d8b4a2f 100644 --- a/youtube_dl/extractor/bbc.py +++ b/youtube_dl/extractor/bbc.py @@ -10,7 +10,6 @@ from ..utils import ( int_or_none, parse_duration, parse_iso8601, - remove_end, unescapeHTML, ) from ..compat import ( @@ -796,9 +795,15 @@ class BBCIE(BBCCoUkIE): entries.append(self._extract_from_playlist_sxml( playlist.get('progressiveDownloadUrl'), playlist_id, timestamp)) + playlist_title = self._og_search_title(webpage, default=None) + playlist_title = playlist_title or self._html_search_regex( + r'(.*?)', webpage, 'playlist title') + + playlist_title = self._search_regex(r'(.+)\s*-\s*BBC', playlist_title, 'title', default=playlist_title) + + playlist_description = self._og_search_description(webpage, default=None) + if entries: - playlist_title = playlist_title or remove_end(self._og_search_title(webpage), ' - BBC News') - playlist_description = playlist_description or self._og_search_description(webpage, default=None) return self.playlist_result(entries, playlist_id, playlist_title, playlist_description) # single video story (e.g. http://www.bbc.com/travel/story/20150625-sri-lankas-spicy-secret) @@ -829,10 +834,6 @@ class BBCIE(BBCCoUkIE): 'subtitles': subtitles, } - playlist_title = self._html_search_regex( - r'(.*?)(?:\s*-\s*BBC [^ ]+)?', webpage, 'playlist title') - playlist_description = self._og_search_description(webpage, default=None) - def extract_all(pattern): return list(filter(None, map( lambda s: self._parse_json(s, playlist_id, fatal=False),