commit 8c5879715f4d979b83c49d44a9094307247097ba
parent ebb0449049c198f04103502c95a13171b854d1c7
Author: Alexander Seiler <seileralex@gmail.com>
Date:   Thu,  6 Dec 2018 21:41:02 +0100

[ard:mediathek] Fix title and description extraction (closes #18349)


Diffstat:
M youtube_dl/extractor/ard.py | 9 +++++++--
1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/youtube_dl/extractor/ard.py b/youtube_dl/extractor/ard.py
@@ -173,13 +173,18 @@ class ARDMediathekIE(InfoExtractor):
         title = self._html_search_regex(
             [r'<h1(?:\s+class="boxTopHeadline")?>(.*?)</h1>',
              r'<meta name="dcterms\.title" content="(.*?)"/>',
-             r'<h4 class="headline">(.*?)</h4>'],
+             r'<h4 class="headline">(.*?)</h4>',
+             r'<title[^>]*>(.*?)</title>'],
             webpage, 'title')
         description = self._html_search_meta(
             'dcterms.abstract', webpage, 'description', default=None)
         if description is None:
             description = self._html_search_meta(
-                'description', webpage, 'meta description')
+                'description', webpage, 'meta description', default=None)
+        if description is None:
+            description = self._html_search_regex(
+                r'<p\s+class="teasertext">(.+?)</p>',
+                webpage, 'teaser text', default=None)
 
         # Thumbnail is sometimes not present.
         # It is in the mobile version, but that seems to use a different URL