aboutsummaryrefslogtreecommitdiff
path: root/youtube_dl/extractor/helsinki.py
blob: 2a54f3cca89d063f321e512554225778c772caff (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
# -*- coding: utf-8 -*-

from __future__ import unicode_literals

import re

from .common import InfoExtractor


class HelsinkiIE(InfoExtractor):
    _VALID_URL = r'https?://video\.helsinki\.fi/Arkisto/flash\.php\?id=(?P<id>\d+)'
    _TEST = {
        'url': 'http://video.helsinki.fi/Arkisto/flash.php?id=20258',
        'md5': 'cd829201b890905682eb194cbdea55d7',
        'info_dict': {
            'id': '20258',
            'ext': 'mp4',
            'title': 'Tietotekniikkafoorumi-iltapäivä',
        }
    }

    def _real_extract(self, url):
        mobj = re.match(self._VALID_URL, url)
        vid = mobj.group('id')
        webpage = self._download_webpage(url, vid)
        formats = []
        mobj = re.search('file=((\w+):[^&]+)', webpage)
        if mobj: formats.append({
            'ext': mobj.group(2),
            'play_path': mobj.group(1),
            'url': 'rtmp://flashvideo.it.helsinki.fi/vod/',
            'player_url': 'http://video.helsinki.fi/player.swf',
            'format_note': 'sd'
        })

        mobj = re.search('hd\.file=((\w+):[^&]+)', webpage)
        if mobj: formats.append({
            'ext': mobj.group(2),
            'play_path': mobj.group(1),
            'url': 'rtmp://flashvideo.it.helsinki.fi/vod/',
            'player_url': 'http://video.helsinki.fi/player.swf',
            'format_note': 'hd'
        })

        return {
            'id': vid,
            'title': self._og_search_title(webpage).replace('Video: ', ''),
            'description': self._og_search_description(webpage),
            'thumbnail': self._og_search_thumbnail(webpage),
            'formats': formats
        }