From 1b28864bce82d8d1a68fc8495b11d1eb7610a8a5 Mon Sep 17 00:00:00 2001 From: lonm Date: Mon, 9 Dec 2024 16:30:51 +0000 Subject: [PATCH] [RadioFrance] ignore empty episodes --- yt_dlp/extractor/radiofrance.py | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/yt_dlp/extractor/radiofrance.py b/yt_dlp/extractor/radiofrance.py index 31851adb9..89680b305 100644 --- a/yt_dlp/extractor/radiofrance.py +++ b/yt_dlp/extractor/radiofrance.py @@ -277,7 +277,10 @@ class RadioFrancePlaylistBaseIE(RadioFranceBaseIE): break def _extract_embedded_episodes(self, item, webpage, content_id): - """Certain episdoes data are embedded directly in the page, use these if the link is missing""" + """Certain episodes data are embedded directly in the page, use these if the link is missing""" + # 'media' may be None if the editor uploads a blank 'info' episode; ignore these. + if item['playerInfo']['media'] is None: + return None links = item['playerInfo']['media']['sources'] item['formats'] = [] for linkkey in links: @@ -401,6 +404,9 @@ class RadioFrancePodcastIE(RadioFrancePlaylistBaseIE): if item['model'] == 'Expression': if item['link'] == '': item = self._extract_embedded_episodes(item, webpage, podcast_id) + # If the embedded episode info could not be extracted, skip this item + if item is None: + continue resp['items'].append(item) # the pagination data is stored in a javascript object 'a' @@ -466,6 +472,9 @@ class RadioFranceProfileIE(RadioFrancePlaylistBaseIE): if item['model'] == 'Expression': if item.link == '': item = self._extract_embedded_episodes(item, webpage, profile_id) + # If the embedded episode info could not be extracted, skip this item + if item is None: + continue resp['items'].append(item) resp['metadata'] = self._search_json(r'content:\s*', webpage, profile_id, profile_id,