diff options
author | MaxReimann <max.reimann@student.hpi.uni-potsdam.de> | 2014-12-21 11:13:59 +0100 |
---|---|---|
committer | MaxReimann <max.reimann@student.hpi.uni-potsdam.de> | 2014-12-21 11:13:59 +0100 |
commit | 3f7421b71b0d7da917a92b6f37985bc26c5dc11d (patch) | |
tree | bab65cc05bb2b2852e5a3d9a7f3291142b1f90cc /youtube_dl | |
parent | ee45625290c678c53b7ee86d2adba40847b79573 (diff) |
fix test and remove lengthy description
Diffstat (limited to 'youtube_dl')
-rw-r--r-- | youtube_dl/extractor/teletask.py | 20 |
1 files changed, 2 insertions, 18 deletions
diff --git a/youtube_dl/extractor/teletask.py b/youtube_dl/extractor/teletask.py index 1c42ac6f4..6920b871e 100644 --- a/youtube_dl/extractor/teletask.py +++ b/youtube_dl/extractor/teletask.py @@ -11,18 +11,12 @@ class TeleTaskIE(InfoExtractor): _VALID_URL = r'http?://(?:www\.)?tele-task\.de/archive/video/html5/(?P<id>[0-9]+)/' _TEST = { 'url': 'http://www.tele-task.de/archive/video/html5/26168/', - 'md5': 'TODO: md5 sum of the first 10241 bytes of the video file (use --test)', + 'md5': '290ef69fb2792e481169c3958dbfbd57', 'info_dict': { 'id': '26168', 'ext': 'mp4', 'title': 'Duplicate Detection', - 'thumbnail': 're:^https?://.*\.jpg$', - 'date': '20141218', - # TODO more properties, either as: - # * A value - # * MD5 checksum; start the string with md5: - # * A regular expression; start the string with re: - # * Any Python type (for example int or float) + 'upload_date': '20141218', } } @@ -30,19 +24,10 @@ class TeleTaskIE(InfoExtractor): video_id = self._match_id(url) webpage = self._download_webpage(url, video_id) - lecture_url = self._html_search_regex( - r'href="([^"]+)" itemprop="name">', webpage, 'title') - lecture_id = re.search("([0-9]+)/",lecture_url).group(1) - overview_page = self._download_webpage("http://www.tele-task.de" + lecture_url, - lecture_id) - title = self._html_search_regex( r'itemprop="name">([^"]+)</a>', webpage, 'title') url = self._html_search_regex( r'class="speaker".*?src="([^"]+)"', webpage, 'video_url', flags=re.DOTALL) - description = self._html_search_regex( - r'Description of the series:</p>([^"]+)</div>', overview_page, - 'description',flags=re.DOTALL) date = self._html_search_regex( r'<td class="label">Date:</td><td>([^"]+)</td>', webpage, 'date') @@ -53,7 +38,6 @@ class TeleTaskIE(InfoExtractor): return { 'id': video_id, 'title': title, - 'description': description, 'url': url, 'upload_date': date, }
\ No newline at end of file |