diff options
| author | Muratcan Simsek <mail@muratcansimsek.com> | 2015-12-07 00:15:19 +0200 | 
|---|---|---|
| committer | Sergey M․ <dstftw@gmail.com> | 2015-12-11 23:00:35 +0600 | 
| commit | ab4bdc913fafc71217c1196602525e0382c4eea3 (patch) | |
| tree | 7268ac241b100cc037ee2fef034dd6c696f770b5 | |
| parent | 1fe248a51b4d03a91302b6a0c272b5fdc116f167 (diff) | |
[funimation] Add new extractor
Update funimation.py
Update funimation.py
Removed unnecessary lines.
Update funimation.py
Added thumbnail and description.
Filename improvement.
fixed TEST.
| -rw-r--r-- | youtube_dl/extractor/__init__.py | 1 | ||||
| -rw-r--r-- | youtube_dl/extractor/funimation.py | 77 | 
2 files changed, 78 insertions, 0 deletions
| diff --git a/youtube_dl/extractor/__init__.py b/youtube_dl/extractor/__init__.py index 3db5cd6d9..3cd95ba01 100644 --- a/youtube_dl/extractor/__init__.py +++ b/youtube_dl/extractor/__init__.py @@ -206,6 +206,7 @@ from .francetv import (  from .freesound import FreesoundIE  from .freespeech import FreespeechIE  from .freevideo import FreeVideoIE +from .funimation import FunimationIE  from .funnyordie import FunnyOrDieIE  from .gameinformer import GameInformerIE  from .gamekings import GamekingsIE diff --git a/youtube_dl/extractor/funimation.py b/youtube_dl/extractor/funimation.py new file mode 100644 index 000000000..773d80fe8 --- /dev/null +++ b/youtube_dl/extractor/funimation.py @@ -0,0 +1,77 @@ +# coding: utf-8 +from __future__ import unicode_literals +from .common import InfoExtractor +from ..compat import compat_HTTPError +from ..utils import ( +    encode_dict, +    sanitized_Request, +    ExtractorError, +    urlencode_postdata +) +import re + +class FunimationIE(InfoExtractor): +    _VALID_URL = r'https?://(?:www\.)?funimation\.com/shows/.+[^ ]/videos/official/(?P<id>[^?]+)' + +    _TEST = { +        'url': 'http://www.funimation.com/shows/air/videos/official/breeze', +        'info_dict': { +            'id': 'AIRENG0001', +            'title': 'Air - 1 - Breeze ', +            'ext': 'mp4', +            'thumbnail': 'http://www.funimation.com/admin/uploads/default/recap_thumbnails/7555590/home_spotlight/AIR0001.jpg', +            'description': 'Travelling puppeteer Yukito arrives in a small town where he hopes to earn money through the magic of his puppets. When a young girl named Misuzu lures him to her home with the promise of food, his life changes forever. ', +        } +    } + +    def _login(self): +        (username, password) = self._get_login_info() +        if username is None: +            return +        login_url = 'http://www.funimation.com/login' +        data = urlencode_postdata(encode_dict({ +            'loginForm2': 'loginform', +            'email_field': username, +            'password_field': password, +        })) +        login_request = sanitized_Request(login_url, data) +        login_request.add_header('Content-Type', 'application/x-www-form-urlencoded') +        try: +            login = self._download_webpage(login_request, login_url) +        except ExtractorError as e: +            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 403: +                raise ExtractorError('Funimation is not available in your region.', expected=True) +            raise +        if re.search(r'<meta property="og:url" content="http://www.funimation.com/login"/>', login) is not None: +                raise ExtractorError('Unable to login, wrong username or password.', expected=True) + +    def _real_initialize(self): +        self._login() + +    def _real_extract(self, url): +        mobj = re.match(self._VALID_URL, url) +        video_id = mobj.group('id') +        try: +            webpage = self._download_webpage(url, video_id) +        except ExtractorError as e: +            if isinstance(e.cause, compat_HTTPError) and e.cause.code == 403: +                raise ExtractorError('Funimation is not available in your region.', expected=True) +            raise +        if re.search(r'"sdUrl":"http', webpage) is None: +                raise ExtractorError('You are not logged-in or the stream requires subscription.', expected=True) + +        m3u8 = self._search_regex(r'".+Url":"(.+?m3u8)"', webpage, 'm3u8') + self._search_regex(r'"authToken":"(.+?)"', webpage, 'm3u8') +        formats = self._extract_m3u8_formats(m3u8.replace('\\', ''), video_id, ext='mp4', entry_protocol='m3u8_native') + +        video_show = self._search_regex(r'"artist":"(.+?)"', webpage, 'video_show') +        video_track = self._search_regex(r'"videoNumber":"(\d+).0"', webpage, 'video_track') +        video_title = self._search_regex(r'"title":"({0}.+?)"'.format(video_track), webpage, 'video_title') +        video_id = self._search_regex(r'"FUNImationID":"(.+?)"', webpage, 'video_id') + +        return { +            'id': video_id, +            'title': video_show + ' - ' + video_title + ' ', +            'formats': formats, +            'thumbnail': self._og_search_thumbnail(webpage), +            'description': self._og_search_description(webpage) +        } | 
