diff options
author | Alexander Seiler <seileralex@gmail.com> | 2018-12-06 21:41:02 +0100 |
---|---|---|
committer | Sergey M <dstftw@gmail.com> | 2018-12-07 03:41:02 +0700 |
commit | 8c5879715f4d979b83c49d44a9094307247097ba (patch) | |
tree | 0d8c57f4a268ec5f3e44f9bda790c102db3c9293 | |
parent | ebb0449049c198f04103502c95a13171b854d1c7 (diff) |
[ard:mediathek] Fix title and description extraction (closes #18349)
-rw-r--r-- | youtube_dl/extractor/ard.py | 9 |
1 file changed, 7 insertions, 2 deletions
```diff
diff --git a/youtube_dl/extractor/ard.py b/youtube_dl/extractor/ard.py
index 6bf8f61eb..84e96f769 100644
--- a/youtube_dl/extractor/ard.py
+++ b/youtube_dl/extractor/ard.py
@@ -173,13 +173,18 @@ class ARDMediathekIE(InfoExtractor):
         title = self._html_search_regex(
             [r'<h1(?:\s+class="boxTopHeadline")?>(.*?)</h1>',
              r'<meta name="dcterms\.title" content="(.*?)"/>',
-             r'<h4 class="headline">(.*?)</h4>'],
+             r'<h4 class="headline">(.*?)</h4>',
+             r'<title[^>]*>(.*?)</title>'],
             webpage, 'title')
         description = self._html_search_meta(
             'dcterms.abstract', webpage, 'description', default=None)
         if description is None:
             description = self._html_search_meta(
-                'description', webpage, 'meta description')
+                'description', webpage, 'meta description', default=None)
+        if description is None:
+            description = self._html_search_regex(
+                r'<p\s+class="teasertext">(.+?)</p>',
+                webpage, 'teaser text', default=None)
 
         # Thumbnail is sometimes not present.
         # It is in the mobile version, but that seems to use a different URL
```