diff options
Diffstat (limited to 'youtube_dl/extractor/vice.py')
| -rw-r--r-- | youtube_dl/extractor/vice.py | 37 | 
1 files changed, 20 insertions, 17 deletions
| diff --git a/youtube_dl/extractor/vice.py b/youtube_dl/extractor/vice.py index 04e2b0ba7..01af7a995 100644 --- a/youtube_dl/extractor/vice.py +++ b/youtube_dl/extractor/vice.py @@ -1,5 +1,4 @@  from __future__ import unicode_literals -import re  from .common import InfoExtractor  from .ooyala import OoyalaIE @@ -7,25 +6,29 @@ from ..utils import ExtractorError  class ViceIE(InfoExtractor): -    _VALID_URL = r'http://www\.vice\.com/.*?/(?P<name>.+)' +    _VALID_URL = r'https?://(?:.+?\.)?vice\.com/(?:[^/]+/)+(?P<id>.+)' -    _TEST = { -        'url': 'http://www.vice.com/Fringes/cowboy-capitalists-part-1', -        'info_dict': { -            'id': '43cW1mYzpia9IlestBjVpd23Yu3afAfp', -            'ext': 'mp4', -            'title': 'VICE_COWBOYCAPITALISTS_PART01_v1_VICE_WM_1080p.mov', -        }, -        'params': { -            # Requires ffmpeg (m3u8 manifest) -            'skip_download': True, -        }, -    } +    _TESTS = [ +        { +            'url': 'http://www.vice.com/Fringes/cowboy-capitalists-part-1', +            'info_dict': { +                'id': '43cW1mYzpia9IlestBjVpd23Yu3afAfp', +                'ext': 'mp4', +                'title': 'VICE_COWBOYCAPITALISTS_PART01_v1_VICE_WM_1080p.mov', +            }, +            'params': { +                # Requires ffmpeg (m3u8 manifest) +                'skip_download': True, +            }, +        }, { +            'url': 'https://news.vice.com/video/experimenting-on-animals-inside-the-monkey-lab', +            'only_matching': True, +        } +    ]      def _real_extract(self, url): -        mobj = re.match(self._VALID_URL, url) -        name = mobj.group('name') -        webpage = self._download_webpage(url, name) +        video_id = self._match_id(url) +        webpage = self._download_webpage(url, video_id)          try:              embed_code = self._search_regex(                  r'embedCode=([^&\'"]+)', webpage, | 
