X-Git-Url: http://git.bitcoin.ninja/index.cgi?a=blobdiff_plain;ds=sidebyside;f=youtube_dl%2Fextractor%2Fnbc.py;h=89a2845fe204695d206d53122585799f9a3e99cd;hb=d236b37ac94cd36657c881e18b8d9187483afa80;hp=3e3de9e2d8c7ffea00415bfd378df43ca1d33135;hpb=d9aa2b784d914ae99c7d9bbaf83d06f1b9dbd04e;p=youtube-dl diff --git a/youtube_dl/extractor/nbc.py b/youtube_dl/extractor/nbc.py index 3e3de9e2d..89a2845fe 100644 --- a/youtube_dl/extractor/nbc.py +++ b/youtube_dl/extractor/nbc.py @@ -1,7 +1,6 @@ from __future__ import unicode_literals import re -import json from .common import InfoExtractor from ..compat import ( @@ -52,9 +51,9 @@ class NBCIE(InfoExtractor): class NBCNewsIE(InfoExtractor): - _VALID_URL = r'''(?x)https?://www\.nbcnews\.com/ - ((video/.+?/(?P\d+))| - ((?Pfeature|nightly-news)/[^/]+/(?P.+))) + _VALID_URL = r'''(?x)https?://(?:www\.)?nbcnews\.com/ + (?:video/.+?/(?P<id>\d+)| + (?:feature|nightly-news)/[^/]+/(?P<title>.+)) ''' _TESTS = [ @@ -120,17 +119,10 @@ class NBCNewsIE(InfoExtractor): # "feature" and "nightly-news" pages use theplatform.com title = mobj.group('title') webpage = self._download_webpage(url, title) - program = mobj.group('program') - if program == 'feature': - bootstrap_json = self._search_regex( - r'var bootstrapJson = ({.+})\s*$', webpage, 'bootstrap json', - flags=re.MULTILINE) - else: - # nightly-news - bootstrap_json = self._search_regex( - r'var playlistData = ({.+});\s*$', webpage, 'playlist data', - flags=re.MULTILINE) - bootstrap = json.loads(bootstrap_json) + bootstrap_json = self._search_regex( + r'var\s+(?:bootstrapJson|playlistData)\s*=\s*({.+});?\s*$', + webpage, 'bootstrap json', flags=re.MULTILINE) + bootstrap = self._parse_json(bootstrap_json, video_id) info = bootstrap['results'][0]['video'] mpxid = info['mpxId']