diff options
author | Allan Zhou <allanzp@gmail.com> | 2013-08-21 00:07:03 -0700 |
---|---|---|
committer | Allan Zhou <allanzp@gmail.com> | 2013-08-21 00:07:03 -0700 |
commit | a3f62b8255120acda6d429d2a3ce53b13e871c5d (patch) | |
tree | 6a1a8707369cd36654be4ef1deb044a1fcce01ba /youtube_dl/extractor/generic.py | |
parent | 37b6d5f684d409365bbac6d3f2b8074b57e643a8 (diff) | |
parent | 6c3e6e88d3aaaea64ca3d96c005da654c89c8a3a (diff) |
Merge remote-tracking branch 'upstream/master'
Diffstat (limited to 'youtube_dl/extractor/generic.py')
-rw-r--r-- | youtube_dl/extractor/generic.py | 12 |
1 files changed, 10 insertions, 2 deletions
diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py
index b633e896c..da016f7ee 100644
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -107,8 +107,13 @@ class GenericIE(InfoExtractor):
         return new_url
 
     def _real_extract(self, url):
-        new_url = self._test_redirect(url)
-        if new_url: return [self.url_result(new_url)]
+        try:
+            new_url = self._test_redirect(url)
+            if new_url:
+                return [self.url_result(new_url)]
+        except compat_urllib_error.HTTPError:
+            # This may be a stupid server that doesn't like HEAD, our UA, or so
+            pass
 
         video_id = url.split('/')[-1]
         try:
@@ -145,6 +150,9 @@ class GenericIE(InfoExtractor):
             if m_video_type is not None:
                 mobj = re.search(r'<meta.*?property="og:video".*?content="(.*?)"', webpage)
         if mobj is None:
+            # HTML5 video
+            mobj = re.search(r'<video[^<]*>.*?<source .*?src="([^"]+)"', webpage, flags=re.DOTALL)
+        if mobj is None:
             raise ExtractorError(u'Invalid URL: %s' % url)
 
         # It's possible that one of the regexes