diff options
| author | Yen Chi Hsuan <yan12125@gmail.com> | 2016-03-04 14:21:23 +0800 | 
|---|---|---|
| committer | Yen Chi Hsuan <yan12125@gmail.com> | 2016-03-04 14:21:23 +0800 | 
| commit | 8477a6928314cff7957fde55e56a05b2acf76871 (patch) | |
| tree | 9647f179ea417b07e4e2be9440de65feae540a27 | |
| parent | d58cb3ec7e115cf07a6cf6e035cbba2b5c6861fd (diff) | |
| parent | 199e72429106375218902102812e26c2fc6624b5 (diff) | |
Merge branch 'kusi' of https://github.com/mutantmonkey/youtube-dl into mutantmonkey-kusi
| -rw-r--r-- | youtube_dl/extractor/__init__.py | 1 | ||||
| -rw-r--r-- | youtube_dl/extractor/kusi.py | 61 | 
2 files changed, 62 insertions, 0 deletions
diff --git a/youtube_dl/extractor/__init__.py b/youtube_dl/extractor/__init__.py
index 037654a23..08b3dc673 100644
--- a/youtube_dl/extractor/__init__.py
+++ b/youtube_dl/extractor/__init__.py
@@ -340,6 +340,7 @@ from .konserthusetplay import KonserthusetPlayIE
 from .kontrtube import KontrTubeIE
 from .krasview import KrasViewIE
 from .ku6 import Ku6IE
+from .kusi import KUSIIE
 from .kuwo import (
     KuwoIE,
     KuwoAlbumIE,
diff --git a/youtube_dl/extractor/kusi.py b/youtube_dl/extractor/kusi.py
new file mode 100644
index 000000000..20407411b
--- /dev/null
+++ b/youtube_dl/extractor/kusi.py
@@ -0,0 +1,78 @@
+# coding: utf-8
+from __future__ import unicode_literals
+
+import re
+
+from .common import InfoExtractor
+from ..compat import compat_urllib_parse_unquote_plus
+from ..utils import (
+    float_or_none,
+    int_or_none,
+    xpath_text,
+)
+
+
+class KUSIIE(InfoExtractor):
+    """Extractor for kusi.com story pages and direct clip URLs."""
+
+    _VALID_URL = r'https?://(?:www\.)?kusi\.com/(?P<path>story/.+|video\?clipId=(?P<clipId>\d+))'
+    _TEST = {
+        'url': 'http://www.kusi.com/story/31183873/turko-files-case-closed-put-on-hold',
+        'md5': 'f926e7684294cf8cb7bdf8858e1b3988',
+        'info_dict': {
+            'id': '12203019',
+            'ext': 'mp4',
+            'title': 'Turko Files: Case Closed! & Put On Hold!',
+            'duration': 231.0,
+        }
+    }
+
+    def _real_extract(self, url):
+        """Resolve the clip id for ``url`` and build its info dict.
+
+        Story pages are downloaded and searched for the embedded clip id;
+        ``video?clipId=`` URLs carry it directly. The clip's feature XML
+        supplies the title, description, duration and MRSS formats.
+        """
+        mobj = re.match(self._VALID_URL, url)
+
+        video_id = mobj.group('clipId')
+        if video_id is None:
+            # Story URLs do not carry the clip id; it is embedded in the page.
+            webpage = self._download_webpage(url, mobj.group('path'))
+            video_id = self._html_search_regex(
+                r'"clipId", "(\d+)"', webpage, 'clipId')
+
+        xml_url = 'http://www.kusi.com/build.asp?buildtype=buildfeaturexml'\
+                  'request&featureType=Clip&featureid={0}&affiliateno=956&'\
+                  'clientgroupid=1&rnd=562461'.format(video_id)
+        doc = self._download_xml(xml_url, video_id,
+                                 note='Downloading video info',
+                                 errnote='Failed to download video info')
+
+        # A missing HEADLINE fails with an extraction error, not AttributeError.
+        video_title = xpath_text(doc, 'HEADLINE', 'title', fatal=True)
+        # DURATION appears to be in milliseconds (the test clip reports 231000).
+        duration = float_or_none(xpath_text(doc, 'DURATION'), scale=1000)
+        # Return the element's text, not the Element object itself.
+        description = xpath_text(doc, 'ABSTRACT')
+
+        quality_options = doc.find('{http://search.yahoo.com/mrss/}group').findall('{http://search.yahoo.com/mrss/}content')
+        formats = []
+        for quality in quality_options:
+            # Entries without a height are skipped.
+            if 'height' in quality.attrib:
+                formats.append({
+                    'url': compat_urllib_parse_unquote_plus(quality.attrib['url']),
+                    # XML attributes are strings; emit a numeric height.
+                    'height': int_or_none(quality.attrib['height']),
+                })
+        self._sort_formats(formats)
+
+        return {
+            'id': video_id,
+            'title': video_title,
+            'description': description,
+            'duration': duration,
+            'formats': formats,
+        }
