diff options
author | Sergey M․ <dstftw@gmail.com> | 2017-10-08 21:36:50 +0700 |
---|---|---|
committer | Sergey M․ <dstftw@gmail.com> | 2017-10-08 21:36:50 +0700 |
commit | 89923316210f8e17bb1a085278940e1c56fcff48 (patch) | |
tree | 0c80781aac4b013d985d424e66b20a7074ef5c7c | |
parent | b0dde6686c7110c9c2515a808d803239a81e6505 (diff) |
[wdr] Relax media link regex (closes #14447)
-rw-r--r-- | youtube_dl/extractor/wdr.py | 9 |
1 files changed, 7 insertions, 2 deletions
diff --git a/youtube_dl/extractor/wdr.py b/youtube_dl/extractor/wdr.py
index 8bb7362bb..621de1e1e 100644
--- a/youtube_dl/extractor/wdr.py
+++ b/youtube_dl/extractor/wdr.py
@@ -22,8 +22,13 @@ class WDRBaseIE(InfoExtractor):
         # for wdrmaus, in a tag with the class "videoButton" (previously a link
         # to the page in a multiline "videoLink"-tag)
         json_metadata = self._html_search_regex(
-            r'class=(?:"(?:mediaLink|wdrrPlayerPlayBtn|videoButton)\b[^"]*"[^>]+|"videoLink\b[^"]*"[\s]*>\n[^\n]*)data-extension="([^"]+)"',
-            webpage, 'media link', default=None, flags=re.MULTILINE)
+            r'''(?sx)class=
+                    (?:
+                        (["\'])(?:mediaLink|wdrrPlayerPlayBtn|videoButton)\b.*?\1[^>]+|
+                        (["\'])videoLink\b.*?\2[\s]*>\n[^\n]*
+                    )data-extension=(["\'])(?P<data>(?:(?!\3).)+)\3
+                    ''',
+            webpage, 'media link', default=None, group='data')
 
         if not json_metadata:
             return