diff options
author | Sergey M․ <dstftw@gmail.com> | 2015-02-14 17:42:12 +0600 |
---|---|---|
committer | Sergey M․ <dstftw@gmail.com> | 2015-02-14 17:42:12 +0600 |
commit | a4f3d779db13ec3c8bda67e897de8cd849a7f811 (patch) | |
tree | cb3c815f51175a293aa2014a0b5d87eea4375bec | |
parent | d9aa2b784d914ae99c7d9bbaf83d06f1b9dbd04e (diff) |
[nbcnews] Simplify
-rw-r--r-- | youtube_dl/extractor/nbc.py | 21 |
1 files changed, 7 insertions, 14 deletions
diff --git a/youtube_dl/extractor/nbc.py b/youtube_dl/extractor/nbc.py index 3e3de9e2d..52e8595ea 100644 --- a/youtube_dl/extractor/nbc.py +++ b/youtube_dl/extractor/nbc.py @@ -52,9 +52,9 @@ class NBCIE(InfoExtractor): class NBCNewsIE(InfoExtractor): - _VALID_URL = r'''(?x)https?://www\.nbcnews\.com/ - ((video/.+?/(?P<id>\d+))| - ((?P<program>feature|nightly-news)/[^/]+/(?P<title>.+))) + _VALID_URL = r'''(?x)https?://(?:www\.)?nbcnews\.com/ + (?:video/.+?/(?P<id>\d+)| + (?:feature|nightly-news)/[^/]+/(?P<title>.+)) ''' _TESTS = [ @@ -120,17 +120,10 @@ class NBCNewsIE(InfoExtractor): # "feature" and "nightly-news" pages use theplatform.com title = mobj.group('title') webpage = self._download_webpage(url, title) - program = mobj.group('program') - if program == 'feature': - bootstrap_json = self._search_regex( - r'var bootstrapJson = ({.+})\s*$', webpage, 'bootstrap json', - flags=re.MULTILINE) - else: - # nightly-news - bootstrap_json = self._search_regex( - r'var playlistData = ({.+});\s*$', webpage, 'playlist data', - flags=re.MULTILINE) - bootstrap = json.loads(bootstrap_json) + bootstrap_json = self._search_regex( + r'var\s+(?:bootstrapJson|playlistData)\s*=\s*({.+});?\s*$', + webpage, 'bootstrap json', flags=re.MULTILINE) + bootstrap = self._parse_json(bootstrap_json, video_id) info = bootstrap['results'][0]['video'] mpxid = info['mpxId'] |