[tagesschau] fix deprecation warning about inline regex flags

The warning during test_download: DeprecationWarning: Flags not at the start of the expression '(?s)<p[^>]+class="in' (truncated)
5 years ago · 2a0d9305f4
parent 74bb98431e
commit 2a0d9305f4
1 changed files with 5 additions and 5 deletions
--- a/youtube_dl/extractor/tagesschau.py
+++ b/youtube_dl/extractor/tagesschau.py
@ -380,13 +380,13 @@ class TagesschauIE(InfoExtractor):
    # Some old pages still use the old format, so we keep the previous
    # extractor for now.
    def _legacy_extract(self, webpage, display_id, title, webpage_type):
-        DOWNLOAD_REGEX = r'(?s)<p>Wir bieten dieses (?P<kind>Video|Audio) in folgenden Formaten zum Download an:</p>\s*<div class="controls">(?P<links>.*?)</div>\s*<p>'
+        DOWNLOAD_REGEX = r'<p>Wir bieten dieses (?P<kind>Video|Audio) in folgenden Formaten zum Download an:</p>\s*<div class="controls">(?P<links>.*?)</div>\s*<p>'

        if webpage_type == 'website':  # Article
            entries = []
            for num, (entry_title, media_kind, download_text) in enumerate(re.findall(
-                    r'(?s)<p[^>]+class="infotext"[^>]*>\s*(?:<a[^>]+>)?\s*<strong>(.+?)</strong>.*?</p>.*?%s' % DOWNLOAD_REGEX,
-                    webpage), 1):
+                    r'<p[^>]+class="infotext"[^>]*>\s*(?:<a[^>]+>)?\s*<strong>(.+?)</strong>.*?</p>.*?%s' % DOWNLOAD_REGEX,
+                    webpage, flags=re.S), 1):
                entries.append({
                    'id': '%s-%d' % (display_id, num),
                    'title': '%s' % entry_title,
@ -397,9 +397,9 @@ class TagesschauIE(InfoExtractor):
            formats = entries[0]['formats']
        else:  # Assume single video
            download_text = self._search_regex(
-                DOWNLOAD_REGEX, webpage, 'download links', group='links')
+                DOWNLOAD_REGEX, webpage, 'download links', flags=re.S, group='links')
            media_kind = self._search_regex(
-                DOWNLOAD_REGEX, webpage, 'media kind', default='Video', group='kind')
+                DOWNLOAD_REGEX, webpage, 'media kind', default='Video', flags=re.S, group='kind')
            formats = self._legacy_extract_formats(download_text, media_kind)
        thumbnail = self._og_search_thumbnail(webpage)
        description = self._html_search_regex(