diff options
| author | Sergey M․ <dstftw@gmail.com> | 2017-04-04 03:05:18 +0700 | 
|---|---|---|
| committer | Sergey M․ <dstftw@gmail.com> | 2017-04-04 03:05:18 +0700 | 
| commit | 2ab0bfcd810b521bcf4de6dd555c0a47e8a69f70 (patch) | |
| tree | 6ef6f6963dd9f991a745c544f5b0bdc728f3adb7 | |
| parent | b022f4f600a2d73c65e569a9f0a19eed47272938 (diff) | |
[vshare] Add extractor (closes #12278)
| -rw-r--r-- | youtube_dl/extractor/extractors.py | 1 | ||||
| -rw-r--r-- | youtube_dl/extractor/vshare.py | 38 | 
2 files changed, 39 insertions, 0 deletions
```diff
diff --git a/youtube_dl/extractor/extractors.py b/youtube_dl/extractor/extractors.py
index 13ca1d2cd..7398dceef 100644
--- a/youtube_dl/extractor/extractors.py
+++ b/youtube_dl/extractor/extractors.py
@@ -1188,6 +1188,7 @@ from .vrv import (
     VRVIE,
     VRVSeriesIE,
 )
+from .vshare import VShareIE
 from .medialaan import MedialaanIE
 from .vube import VubeIE
 from .vuclip import VuClipIE
diff --git a/youtube_dl/extractor/vshare.py b/youtube_dl/extractor/vshare.py
new file mode 100644
index 000000000..5addbc280
--- /dev/null
+++ b/youtube_dl/extractor/vshare.py
@@ -0,0 +1,38 @@
+# coding: utf-8
+from __future__ import unicode_literals
+
+from .common import InfoExtractor
+
+
+class VShareIE(InfoExtractor):
+    _VALID_URL = r'https?://(?:www\.)?vshare\.io/[dv]/(?P<id>[^/?#&]+)'
+    _TESTS = [{
+        'url': 'https://vshare.io/d/0f64ce6',
+        'md5': '16d7b8fef58846db47419199ff1ab3e7',
+        'info_dict': {
+            'id': '0f64ce6',
+            'title': 'vl14062007715967',
+            'ext': 'mp4',
+        }
+    }, {
+        'url': 'https://vshare.io/v/0f64ce6/width-650/height-430/1',
+        'only_matching': True,
+    }]
+
+    def _real_extract(self, url):
+        video_id = self._match_id(url)
+
+        webpage = self._download_webpage(
+            'https://vshare.io/d/%s' % video_id, video_id)
+
+        title = self._html_search_regex(
+            r'(?s)<div id="root-container">(.+?)<br/>', webpage, 'title')
+        video_url = self._search_regex(
+            r'<a[^>]+href=(["\'])(?P<url>(?:https?:)?//.+?)\1[^>]*>[Cc]lick\s+here',
+            webpage, 'video url', group='url')
+
+        return {
+            'id': video_id,
+            'title': title,
+            'url': video_url,
+        }
```
