diff options
| author | Sergey M․ <dstftw@gmail.com> | 2019-05-23 23:52:11 +0700 | 
|---|---|---|
| committer | Sergey M․ <dstftw@gmail.com> | 2019-05-23 23:52:11 +0700 | 
| commit | f856816b940d95e995c2b9995d01097ab144a1af (patch) | |
| tree | aaa1a8b8ec2c154d33e8ce7d5d2dd066e1066c90 /youtube_dl/extractor/common.py | |
| parent | 8af49fc276b2cf2154b9342de4b4cd66f9d17af9 (diff) | |
[extractor/common] Strip src attribute for HTML5 entries code (closes #18485, closes #21169)
Diffstat (limited to 'youtube_dl/extractor/common.py')
| -rw-r--r-- | youtube_dl/extractor/common.py | 7 | 
1 file changed, 4 insertions, 3 deletions
```diff
diff --git a/youtube_dl/extractor/common.py b/youtube_dl/extractor/common.py
index 937237b3f..9c3e9eec6 100644
--- a/youtube_dl/extractor/common.py
+++ b/youtube_dl/extractor/common.py
@@ -67,6 +67,7 @@ from ..utils import (
     sanitized_Request,
     sanitize_filename,
     str_or_none,
+    strip_or_none,
     unescapeHTML,
     unified_strdate,
     unified_timestamp,
@@ -2480,7 +2481,7 @@ class InfoExtractor(object):
                 'subtitles': {},
             }
             media_attributes = extract_attributes(media_tag)
-            src = media_attributes.get('src')
+            src = strip_or_none(media_attributes.get('src'))
             if src:
                 _, formats = _media_formats(src, media_type)
                 media_info['formats'].extend(formats)
@@ -2490,7 +2491,7 @@ class InfoExtractor(object):
                     s_attr = extract_attributes(source_tag)
                     # data-video-src and data-src are non standard but seen
                     # several times in the wild
-                    src = dict_get(s_attr, ('src', 'data-video-src', 'data-src'))
+                    src = strip_or_none(dict_get(s_attr, ('src', 'data-video-src', 'data-src')))
                     if not src:
                         continue
                     f = parse_content_type(s_attr.get('type'))
@@ -2533,7 +2534,7 @@ class InfoExtractor(object):
                     track_attributes = extract_attributes(track_tag)
                     kind = track_attributes.get('kind')
                     if not kind or kind in ('subtitles', 'captions'):
-                        src = track_attributes.get('src')
+                        src = strip_or_none(track_attributes.get('src'))
                         if not src:
                             continue
                         lang = track_attributes.get('srclang') or track_attributes.get('lang') or track_attributes.get('label')
```
