|
|
|
@ -1,6 +1,7 @@
|
|
|
|
|
# coding: utf-8
|
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
|
|
import json
|
|
|
|
|
import re
|
|
|
|
|
|
|
|
|
|
from .common import InfoExtractor
|
|
|
|
@ -13,6 +14,7 @@ from ..utils import (
|
|
|
|
|
xpath_element,
|
|
|
|
|
xpath_with_ns,
|
|
|
|
|
find_xpath_attr,
|
|
|
|
|
parse_duration,
|
|
|
|
|
parse_iso8601,
|
|
|
|
|
parse_age_limit,
|
|
|
|
|
int_or_none,
|
|
|
|
@ -359,3 +361,63 @@ class CBCWatchIE(CBCWatchBaseIE):
|
|
|
|
|
video_id = self._match_id(url)
|
|
|
|
|
rss = self._call_api('web/browse/' + video_id, video_id)
|
|
|
|
|
return self._parse_rss_feed(rss)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CBCOlympicsIE(InfoExtractor):
|
|
|
|
|
IE_NAME = 'cbc.ca:olympics'
|
|
|
|
|
_VALID_URL = r'https?://olympics\.cbc\.ca/video/[^/]+/(?P<id>[^/?#]+)'
|
|
|
|
|
_TESTS = [{
|
|
|
|
|
'url': 'https://olympics.cbc.ca/video/whats-on-tv/olympic-morning-featuring-the-opening-ceremony/',
|
|
|
|
|
'only_matching': True,
|
|
|
|
|
}]
|
|
|
|
|
|
|
|
|
|
def _real_extract(self, url):
|
|
|
|
|
display_id = self._match_id(url)
|
|
|
|
|
webpage = self._download_webpage(url, display_id)
|
|
|
|
|
video_id = self._hidden_inputs(webpage)['videoId']
|
|
|
|
|
video_doc = self._download_xml(
|
|
|
|
|
'https://olympics.cbc.ca/videodata/%s.xml' % video_id, video_id)
|
|
|
|
|
title = xpath_text(video_doc, 'title', fatal=True)
|
|
|
|
|
is_live = xpath_text(video_doc, 'kind') == 'Live'
|
|
|
|
|
if is_live:
|
|
|
|
|
title = self._live_title(title)
|
|
|
|
|
|
|
|
|
|
formats = []
|
|
|
|
|
for video_source in video_doc.findall('videoSources/videoSource'):
|
|
|
|
|
uri = xpath_text(video_source, 'uri')
|
|
|
|
|
if not uri:
|
|
|
|
|
continue
|
|
|
|
|
tokenize = self._download_json(
|
|
|
|
|
'https://olympics.cbc.ca/api/api-akamai/tokenize',
|
|
|
|
|
video_id, data=json.dumps({
|
|
|
|
|
'VideoSource': uri,
|
|
|
|
|
}).encode(), headers={
|
|
|
|
|
'Content-Type': 'application/json',
|
|
|
|
|
'Referer': url,
|
|
|
|
|
# d3.VideoPlayer._init in https://olympics.cbc.ca/components/script/base.js
|
|
|
|
|
'Cookie': '_dvp=TK:C0ObxjerU', # AKAMAI CDN cookie
|
|
|
|
|
}, fatal=False)
|
|
|
|
|
if not tokenize:
|
|
|
|
|
continue
|
|
|
|
|
content_url = tokenize['ContentUrl']
|
|
|
|
|
video_source_format = video_source.get('format')
|
|
|
|
|
if video_source_format == 'IIS':
|
|
|
|
|
formats.extend(self._extract_ism_formats(
|
|
|
|
|
content_url, video_id, ism_id=video_source_format, fatal=False))
|
|
|
|
|
else:
|
|
|
|
|
formats.extend(self._extract_m3u8_formats(
|
|
|
|
|
content_url, video_id, 'mp4',
|
|
|
|
|
'm3u8' if is_live else 'm3u8_native',
|
|
|
|
|
m3u8_id=video_source_format, fatal=False))
|
|
|
|
|
self._sort_formats(formats)
|
|
|
|
|
|
|
|
|
|
return {
|
|
|
|
|
'id': video_id,
|
|
|
|
|
'display_id': display_id,
|
|
|
|
|
'title': title,
|
|
|
|
|
'description': xpath_text(video_doc, 'description'),
|
|
|
|
|
'thumbnail': xpath_text(video_doc, 'thumbnailUrl'),
|
|
|
|
|
'duration': parse_duration(xpath_text(video_doc, 'duration')),
|
|
|
|
|
'formats': formats,
|
|
|
|
|
'is_live': is_live,
|
|
|
|
|
}
|
|
|
|
|