diff options
| author | rzhxeo <rzhxeot7z81b4700@mailcatch.com> | 2013-10-28 17:35:01 +0100 | 
|---|---|---|
| committer | rzhxeo <rzhxeot7z81b4700@mailcatch.com> | 2013-10-28 17:35:01 +0100 | 
| commit | 32a35e441874ad9daba10c29a6a33f13a4953fbb (patch) | |
| tree | 331dca00be6d148edc0b0a322345f6ef48429e8a | |
| parent | 79b3f6122840cf386cde6c9ec13453121944c7b0 (diff) | |
Add support for http://www.extremetube.com
| -rw-r--r-- | youtube_dl/extractor/__init__.py | 1 |
| -rw-r--r-- | youtube_dl/extractor/extremetube.py | 52 | 
2 files changed, 53 insertions, 0 deletions
| diff --git a/youtube_dl/extractor/__init__.py b/youtube_dl/extractor/__init__.py index 0d933986f..5eed1eebd 100644 --- a/youtube_dl/extractor/__init__.py +++ b/youtube_dl/extractor/__init__.py @@ -39,6 +39,7 @@ from .ehow import EHowIE  from .eighttracks import EightTracksIE  from .escapist import EscapistIE  from .exfm import ExfmIE +from .extremetube import ExtremeTubeIE  from .facebook import FacebookIE  from .faz import FazIE  from .fktv import ( diff --git a/youtube_dl/extractor/extremetube.py b/youtube_dl/extractor/extremetube.py new file mode 100644 index 000000000..981de430d --- /dev/null +++ b/youtube_dl/extractor/extremetube.py @@ -0,0 +1,52 @@ +import os +import re + +from .common import InfoExtractor +from ..utils import ( +    compat_urllib_parse_urlparse, +    compat_urllib_request, +    compat_urllib_parse, +) + +class ExtremeTubeIE(InfoExtractor): +    _VALID_URL = r'^(?:https?://)?(?:www\.)?(?P<url>extremetube\.com/video/.+?(?P<videoid>[0-9]+))(?:[/?&]|$)' +    _TEST = { +        u'url': u'http://www.extremetube.com/video/music-video-14-british-euro-brit-european-cumshots-swallow-652431', +        u'file': u'652431.mp4', +        u'md5': u'1fb9228f5e3332ec8c057d6ac36f33e0', +        u'info_dict': { +            u"title": u"Music Video 14 british euro brit european cumshots swallow", +            u"uploader": u"unknown", +            u"age_limit": 18, +        } +    } + +    def _real_extract(self, url): +        mobj = re.match(self._VALID_URL, url) +        video_id = mobj.group('videoid') +        url = 'http://www.' 
+ mobj.group('url') + +        req = compat_urllib_request.Request(url) +        req.add_header('Cookie', 'age_verified=1') +        webpage = self._download_webpage(req, video_id) + +        video_title = self._html_search_regex(r'<h1 [^>]*?title="([^"]+)"[^>]*>\1<', webpage, u'title') +        uploader = self._html_search_regex(r'>Posted by:(?=<)(\s|<[^>]*>)*(.+?)\|', webpage, u'uploader', fatal=False) +        video_url = compat_urllib_parse.unquote(self._html_search_regex(r'video_url=(.+?)&', webpage, u'video_url')) +        path = compat_urllib_parse_urlparse( video_url ).path +        extension = os.path.splitext( path )[1][1:] +        format = path.split('/')[5].split('_')[:2] +        format = "-".join( format ) + +        age_limit = self._rta_search(webpage) + +        return { +            'id': video_id, +            'title': video_title, +            'uploader': uploader, +            'url': video_url, +            'ext': extension, +            'format': format, +            'format_id': format, +            'age_limit': age_limit, +        } | 
