yt-dlc/yt_dlp/downloader/youtube_live_chat.py

from __future__ import division, unicode_literals

import json

from .fragment import FragmentFD
from ..compat import compat_urllib_error
from ..utils import (
    try_get,
    RegexNotFoundError,
)
from ..extractor.youtube import YoutubeBaseInfoExtractor as YT_BaseIE


class YoutubeLiveChatReplayFD(FragmentFD):
    """Download a YouTube live chat replay fragment by fragment.

    The page at ``info_dict['url']`` is fetched first to obtain the initial
    continuation token and the ytcfg values ``INNERTUBE_API_KEY`` and
    ``INNERTUBE_CONTEXT``. Every further fragment is requested from the
    ``get_live_chat_replay`` endpoint with a JSON body, and each chat action
    found in the response is appended to the output as one JSON document per
    line.
    """

    FD_NAME = 'youtube_live_chat_replay'

    def real_download(self, filename, info_dict):
        """Download the live chat replay described by *info_dict*.

        Reads ``video_id``, ``url`` and (optionally) ``http_headers`` from
        *info_dict*, and the ``fragment_retries`` and ``test`` options from
        ``self.params``.

        Returns True once no further continuation token is available (or
        after the first fragment when the ``test`` option is set). Returns
        False when the initial page cannot be downloaded, when the initial
        data or the ytcfg values are missing from it, or when a fragment
        download fails.
        """
        video_id = info_dict['video_id']
        self.to_screen('[%s] Downloading live chat' % self.FD_NAME)

        fragment_retries = self.params.get('fragment_retries', 0)
        test = self.params.get('test', False)

        ctx = {
            'filename': filename,
            'live': True,
            'total_frags': None,
        }

        ie = YT_BaseIE(self.ydl)

        def dl_fragment(url, data=None, headers=None):
            """Fetch *url*, layering *headers* over the info dict's HTTP headers."""
            http_headers = info_dict.get('http_headers', {})
            if headers:
                # Copy first so the headers stored in info_dict are not mutated
                http_headers = http_headers.copy()
                http_headers.update(headers)
            return self._download_fragment(ctx, url, info_dict, http_headers, data)

        def parse_actions(live_chat_continuation):
            """Serialise the chat actions of one continuation.

            Returns ``(processed_fragment, continuation_id, offset)`` where
            *processed_fragment* holds every action as a UTF-8 JSON line,
            *offset* is the ``videoOffsetTimeMsec`` of the last
            ``replayChatItemAction`` seen (None if there was none) and
            *continuation_id* is the next continuation token (None if there
            was no replay action or no token).
            """
            offset = continuation_id = None
            processed_fragment = bytearray()
            for action in live_chat_continuation.get('actions', []):
                if 'replayChatItemAction' in action:
                    offset = int(action['replayChatItemAction']['videoOffsetTimeMsec'])
                processed_fragment.extend(
                    json.dumps(action, ensure_ascii=False).encode('utf-8') + b'\n')
            # Only look for a next token when this fragment carried replay actions
            if offset is not None:
                continuation_id = try_get(
                    live_chat_continuation,
                    lambda x: x['continuations'][0]['liveChatReplayContinuationData']['continuation'])
            return processed_fragment, continuation_id, offset

        def download_and_parse_fragment(url, frag_index, request_data):
            """Download one fragment and append its chat actions to the output.

            Returns ``(success, continuation_id, offset)``. An HTTPError is
            retried up to ``fragment_retries`` times; any other failure
            returns ``(False, None, None)`` immediately.
            """
            count = 0
            while count <= fragment_retries:
                try:
                    success, raw_fragment = dl_fragment(url, request_data, {'content-type': 'application/json'})
                    if not success:
                        return False, None, None
                    # Decode once; the same text feeds both parsers below.
                    # json.loads() only accepts bytes from Python 3.6 onwards.
                    fragment_text = raw_fragment.decode('utf-8', 'replace')
                    try:
                        data = ie._extract_yt_initial_data(video_id, fragment_text)
                    except RegexNotFoundError:
                        data = None
                    if not data:
                        # No embedded initial data: treat the body as plain JSON
                        data = json.loads(fragment_text)
                    live_chat_continuation = try_get(
                        data,
                        lambda x: x['continuationContents']['liveChatContinuation'], dict) or {}
                    processed_fragment, continuation_id, offset = parse_actions(live_chat_continuation)
                    self._append_fragment(ctx, processed_fragment)

                    return True, continuation_id, offset
                except compat_urllib_error.HTTPError as err:
                    count += 1
                    if count <= fragment_retries:
                        self.report_retry_fragment(err, frag_index, count, fragment_retries)
            # The loop only falls through once every retry has been used up
            self.report_error('giving up after %s fragment retries' % fragment_retries)
            return False, None, None

        self._prepare_and_start_frag_download(ctx)

        success, raw_fragment = dl_fragment(info_dict['url'])
        if not success:
            return False
        # Decoded once and reused for both the initial data and the ytcfg lookup
        webpage = raw_fragment.decode('utf-8', 'replace')
        try:
            data = ie._extract_yt_initial_data(video_id, webpage)
        except RegexNotFoundError:
            return False
        continuation_id = try_get(
            data,
            lambda x: x['contents']['twoColumnWatchNextResults']['conversationBar']['liveChatRenderer']['continuations'][0]['reloadContinuationData']['continuation'])
        # no data yet but required to call _append_fragment
        self._append_fragment(ctx, b'')

        ytcfg = ie._extract_ytcfg(video_id, webpage)

        if not ytcfg:
            return False
        api_key = try_get(ytcfg, lambda x: x['INNERTUBE_API_KEY'])
        innertube_context = try_get(ytcfg, lambda x: x['INNERTUBE_CONTEXT'])
        if not api_key or not innertube_context:
            return False
        url = 'https://www.youtube.com/youtubei/v1/live_chat/get_live_chat_replay?key=' + api_key

        frag_index = offset = 0
        while continuation_id is not None:
            frag_index += 1
            request_data = {
                'context': innertube_context,
                'continuation': continuation_id,
            }
            if frag_index > 1:
                # Ask from 5000 ms before the last seen offset, clamped at zero
                request_data['currentPlayerState'] = {'playerOffsetMs': str(max(offset - 5000, 0))}
            success, continuation_id, offset = download_and_parse_fragment(
                url, frag_index, json.dumps(request_data, ensure_ascii=False).encode('utf-8') + b'\n')
            if not success:
                return False
            if test:
                # Test mode stops after the first fragment
                break

        self._finish_frag_download(ctx)
        return True
support youtube live chat replay 4 years ago			`from __future__ import division, unicode_literals`

			`import json`

			`from .fragment import FragmentFD`
[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`from ..compat import compat_urllib_error`
#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`from ..utils import (`
			`try_get,`
			`RegexNotFoundError,`
			`)`
[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`from ..extractor.youtube import YoutubeBaseInfoExtractor as YT_BaseIE`
support youtube live chat replay 4 years ago

			`class YoutubeLiveChatReplayFD(FragmentFD):`
			`""" Downloads YouTube live chat replays fragment by fragment """`

			`FD_NAME = 'youtube_live_chat_replay'`

			`def real_download(self, filename, info_dict):`
			`video_id = info_dict['video_id']`
			`self.to_screen('[%s] Downloading live chat' % self.FD_NAME)`

[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`fragment_retries = self.params.get('fragment_retries', 0)`
support youtube live chat replay 4 years ago			`test = self.params.get('test', False)`

			`ctx = {`
			`'filename': filename,`
			`'live': True,`
			`'total_frags': None,`
			`}`

#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`ie = YT_BaseIE(self.ydl)`
support youtube live chat replay 4 years ago
#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`def dl_fragment(url, data=None, headers=None):`
			`http_headers = info_dict.get('http_headers', {})`
			`if headers:`
			`http_headers = http_headers.copy()`
			`http_headers.update(headers)`
			`return self._download_fragment(ctx, url, info_dict, http_headers, data)`
support youtube live chat replay 4 years ago
#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`def download_and_parse_fragment(url, frag_index, request_data):`
[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`count = 0`
			`while count <= fragment_retries:`
			`try:`
#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`success, raw_fragment = dl_fragment(url, request_data, {'content-type': 'application/json'})`
[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`if not success:`
			`return False, None, None`
#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`try:`
			`data = ie._extract_yt_initial_data(video_id, raw_fragment.decode('utf-8', 'replace'))`
			`except RegexNotFoundError:`
			`data = None`
[youtube_live_chat] Improve extraction :ci skip dl 4 years ago			`if not data:`
#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`data = json.loads(raw_fragment)`
[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`live_chat_continuation = try_get(`
			`data,`
			`lambda x: x['continuationContents']['liveChatContinuation'], dict) or {}`
			`offset = continuation_id = None`
			`processed_fragment = bytearray()`
			`for action in live_chat_continuation.get('actions', []):`
			`if 'replayChatItemAction' in action:`
			`replay_chat_item_action = action['replayChatItemAction']`
			`offset = int(replay_chat_item_action['videoOffsetTimeMsec'])`
			`processed_fragment.extend(`
			`json.dumps(action, ensure_ascii=False).encode('utf-8') + b'\n')`
			`if offset is not None:`
			`continuation_id = try_get(`
			`live_chat_continuation,`
			`lambda x: x['continuations'][0]['liveChatReplayContinuationData']['continuation'])`
			`self._append_fragment(ctx, processed_fragment)`

			`return True, continuation_id, offset`
			`except compat_urllib_error.HTTPError as err:`
			`count += 1`
			`if count <= fragment_retries:`
			`self.report_retry_fragment(err, frag_index, count, fragment_retries)`
			`if count > fragment_retries:`
			`self.report_error('giving up after %s fragment retries' % fragment_retries)`
			`return False, None, None`

support youtube live chat replay 4 years ago			`self._prepare_and_start_frag_download(ctx)`

[youtube_live_chat] fix bug when trying to set cookies Closes #194 4 years ago			`success, raw_fragment = dl_fragment(info_dict['url'])`
support youtube live chat replay 4 years ago			`if not success:`
			`return False`
#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`try:`
			`data = ie._extract_yt_initial_data(video_id, raw_fragment.decode('utf-8', 'replace'))`
			`except RegexNotFoundError:`
			`return False`
[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`continuation_id = try_get(`
			`data,`
			`lambda x: x['contents']['twoColumnWatchNextResults']['conversationBar']['liveChatRenderer']['continuations'][0]['reloadContinuationData']['continuation'])`
support youtube live chat replay 4 years ago			`# no data yet but required to call _append_fragment`
			`self._append_fragment(ctx, b'')`

#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`ytcfg = ie._extract_ytcfg(video_id, raw_fragment.decode('utf-8', 'replace'))`

			`if not ytcfg:`
			`return False`
			`api_key = try_get(ytcfg, lambda x: x['INNERTUBE_API_KEY'])`
			`innertube_context = try_get(ytcfg, lambda x: x['INNERTUBE_CONTEXT'])`
			`if not api_key or not innertube_context:`
			`return False`
			`url = 'https://www.youtube.com/youtubei/v1/live_chat/get_live_chat_replay?key=' + api_key`

[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`frag_index = offset = 0`
support youtube live chat replay 4 years ago			`while continuation_id is not None:`
[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`frag_index += 1`
#86 [youtube_live_chat] Use POST API (Closes #82) YouTube has removed support for the old GET based live chat API, and it's now returning 404 Authored by siikamiika 4 years ago			`request_data = {`
			`'context': innertube_context,`
			`'continuation': continuation_id,`
			`}`
			`if frag_index > 1:`
			`request_data['currentPlayerState'] = {'playerOffsetMs': str(max(offset - 5000, 0))}`
			`success, continuation_id, offset = download_and_parse_fragment(`
			`url, frag_index, json.dumps(request_data, ensure_ascii=False).encode('utf-8') + b'\n')`
[youtube_live_chat] Fix `parse_yt_initial_data` and add `fragment_retries` :ci skip dl 4 years ago			`if not success:`
			`return False`
			`if test:`
support youtube live chat replay 4 years ago			`break`

			`self._finish_frag_download(ctx)`
			`return True`