Skip to content

Commit

Permalink
[ie/massengeschmack.tv] Fix title extraction (yt-dlp#7813)
Browse files: browse the repository at this point in the history
Authored by: sb0stn
  • Loading branch information
sb0stn authored and aalsuwaidi committed Apr 21, 2024
1 parent baaaa7d commit 51ed84c
Showing 1 changed file with 6 additions and 7 deletions.
13 changes: 6 additions & 7 deletions yt_dlp/extractor/massengeschmacktv.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -17,21 +17,19 @@ class MassengeschmackTVIE(InfoExtractor):

_TEST = {
'url': 'https://massengeschmack.tv/play/fktv202',
'md5': 'a9e054db9c2b5a08f0a0527cc201e8d3',
'md5': '9996f314994a49fefe5f39aa1b07ae21',
'info_dict': {
'id': 'fktv202',
'ext': 'mp4',
'title': 'Fernsehkritik-TV - Folge 202',
'title': 'Fernsehkritik-TV #202',
'thumbnail': 'https://cache.massengeschmack.tv/img/mag/fktv202.jpg'
},
}

def _real_extract(self, url):
episode = self._match_id(url)

webpage = self._download_webpage(url, episode)
title = clean_html(self._html_search_regex(
'<h3>([^<]+)</h3>', webpage, 'title'))
thumbnail = self._search_regex(r'POSTER\s*=\s*"([^"]+)', webpage, 'thumbnail', fatal=False)
sources = self._parse_json(self._search_regex(r'(?s)MEDIA\s*=\s*(\[.+?\]);', webpage, 'media'), episode, js_to_json)

formats = []
Expand Down Expand Up @@ -67,7 +65,8 @@ def _real_extract(self, url):

return {
'id': episode,
'title': title,
'title': clean_html(self._html_search_regex(
r'<span[^>]+\bid=["\']clip-title["\'][^>]*>([^<]+)', webpage, 'title', fatal=False)),
'formats': formats,
'thumbnail': thumbnail,
'thumbnail': self._search_regex(r'POSTER\s*=\s*"([^"]+)', webpage, 'thumbnail', fatal=False),
}

0 comments on commit 51ed84c

Please sign in to comment.