diff options
Diffstat (limited to 'youtube_dl/extractor/vk.py')
| -rw-r--r-- | youtube_dl/extractor/vk.py | 35 | 
1 files changed, 27 insertions, 8 deletions
| diff --git a/youtube_dl/extractor/vk.py b/youtube_dl/extractor/vk.py index 0805e3c08..d560a4b5e 100644 --- a/youtube_dl/extractor/vk.py +++ b/youtube_dl/extractor/vk.py @@ -11,6 +11,7 @@ from ..compat import (  )  from ..utils import (      ExtractorError, +    int_or_none,      orderedSet,      sanitized_Request,      str_to_int, @@ -141,10 +142,10 @@ class VKIE(InfoExtractor):              'url': 'https://vk.com/video276849682_170681728',              'info_dict': {                  'id': 'V3K4mi0SYkc', -                'ext': 'mp4', +                'ext': 'webm',                  'title': "DSWD Awards 'Children's Joy Foundation, Inc.' Certificate of Registration and License to Operate",                  'description': 'md5:bf9c26cfa4acdfb146362682edd3827a', -                'duration': 179, +                'duration': 178,                  'upload_date': '20130116',                  'uploader': "Children's Joy Foundation",                  'uploader_id': 'thecjf', @@ -152,6 +153,19 @@ class VKIE(InfoExtractor):              },          },          { +            # video key is extra_data not url\d+ +            'url': 'http://vk.com/video-110305615_171782105', +            'md5': 'e13fcda136f99764872e739d13fac1d1', +            'info_dict': { +                'id': '171782105', +                'ext': 'mp4', +                'title': 'S-Dance, репетиции к The way show', +                'uploader': 'THE WAY SHOW | 17 апреля', +                'upload_date': '20160207', +                'view_count': int, +            }, +        }, +        {              # removed video, just testing that we match the pattern              'url': 'http://vk.com/feed?z=video-43215063_166094326%2Fbb50cacd3177146d7a',              'only_matching': True, @@ -298,12 +312,17 @@ class VKIE(InfoExtractor):              view_count = str_to_int(self._search_regex(                  r'([\d,.]+)', views, 'view count', fatal=False)) -        formats = [{ -            'format_id': k, -            'url': v, -            'width': int(k[len('url'):]), -        } for k, v in data.items() -            if k.startswith('url')] +        formats = [] +        for k, v in data.items(): +            if not k.startswith('url') and k != 'extra_data' or not v: +                continue +            height = int_or_none(self._search_regex( +                r'^url(\d+)', k, 'height', default=None)) +            formats.append({ +                'format_id': k, +                'url': v, +                'height': height, +            })          self._sort_formats(formats)          return { | 
