[GoPro] Add extractor (#1167)

Fixes: https://github.com/ytdl-org/youtube-dl/issues/30044
Authored by: i6t
pull/1179/head
i6t 4 years ago committed by GitHub
parent 0f0ac87be3
commit d92125aeba
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@ -524,6 +524,7 @@ from .googlepodcasts import (
GooglePodcastsFeedIE, GooglePodcastsFeedIE,
) )
from .googlesearch import GoogleSearchIE from .googlesearch import GoogleSearchIE
from .gopro import GoProIE
from .goshgay import GoshgayIE from .goshgay import GoshgayIE
from .gotostage import GoToStageIE from .gotostage import GoToStageIE
from .gputechconf import GPUTechConfIE from .gputechconf import GPUTechConfIE

@ -0,0 +1,110 @@
# coding: utf-8
from __future__ import unicode_literals
from .common import InfoExtractor
from ..utils import (
int_or_none,
remove_end,
str_or_none,
try_get,
unified_timestamp,
url_or_none,
)
class GoProIE(InfoExtractor):
    """Extractor for videos shared through ``gopro.com/v/<id>`` links.

    The share page embeds its state in a ``window.__reflectData`` JavaScript
    assignment. The id of the first entry in its ``collectionMedia`` list is
    used to query ``https://api.gopro.com/media/<id>/download``, whose
    ``_embedded.variations`` entries become the formats.
    """

    _VALID_URL = r'https?://(www\.)?gopro\.com/v/(?P<id>[A-Za-z0-9]+)'
    _TESTS = [{
        'url': 'https://gopro.com/v/ZNVvED8QDzR5V',
        'info_dict': {
            'id': 'ZNVvED8QDzR5V',
            'title': 'My GoPro Adventure - 9/19/21',
            'thumbnail': r're:https?://.+',
            'ext': 'mp4',
            'timestamp': 1632072947,
            'upload_date': '20210919',
            'uploader_id': 'fireydive30018',
            'duration': 396062,
        }
    }, {
        'url': 'https://gopro.com/v/KRm6Vgp2peg4e',
        'info_dict': {
            'id': 'KRm6Vgp2peg4e',
            'title': 'じゃがいも カリカリ オーブン焼き',
            'thumbnail': r're:https?://.+',
            'ext': 'mp4',
            'timestamp': 1607231125,
            'upload_date': '20201206',
            'uploader_id': 'dc9bcb8b-47d2-47c6-afbc-4c48f9a3769e',
            'duration': 45187,
            'track': 'The Sky Machine',
        }
    }, {
        'url': 'https://gopro.com/v/kVrK9wlJvBMwn',
        'info_dict': {
            'id': 'kVrK9wlJvBMwn',
            'title': 'DARKNESS',
            'thumbnail': r're:https?://.+',
            'ext': 'mp4',
            'timestamp': 1594183735,
            'upload_date': '20200708',
            'uploader_id': '闇夜乃皇帝',
            'duration': 313075,
            'track': 'Battery (Live)',
            'artist': 'Metallica',
        }
    }]

    def _extract_reflect_data(self, webpage, video_id):
        """Return the decoded ``window.__reflectData`` value found in *webpage*.

        The text following the assignment is decoded as one JSON value, so
        semicolons inside string values no longer cut the payload short, and
        the raw text is not passed through HTML clean-up before parsing.
        A missing assignment or undecodable payload is reported by the
        base-class ``_search_regex`` / ``_parse_json`` helpers.
        """
        # Function-scope import so this block does not depend on a change to
        # the module's import section.
        import json

        # Grab everything after the assignment; the JSON decoder below decides
        # where the value actually ends.
        tail = self._search_regex(
            r'(?s)window\.__reflectData\s*=\s*(.+)', webpage, 'metadata')
        try:
            # raw_decode() parses one leading JSON value and ignores whatever
            # follows it (trailing ';', closing </script>, rest of the page).
            metadata, _ = json.JSONDecoder().raw_decode(tail)
        except ValueError:
            # Fall back to the previous "up to the first semicolon" capture so
            # that a parse failure is still raised through _parse_json.
            return self._parse_json(tail.partition(';')[0], video_id)
        return metadata

    def _real_extract(self, url):
        """Build the info dict for the share page at *url*."""
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)

        metadata = self._extract_reflect_data(webpage, video_id)

        # Only the first media entry of the collection is extracted.
        video_info = metadata['collectionMedia'][0]
        media_data = self._download_json(
            'https://api.gopro.com/media/%s/download' % video_info['id'], video_id)

        formats = []
        for fmt in try_get(media_data, lambda x: x['_embedded']['variations']) or []:
            format_url = url_or_none(fmt.get('url'))
            if not format_url:
                # Variations without a usable URL cannot be downloaded.
                continue
            formats.append({
                'url': format_url,
                'format_id': str_or_none(fmt.get('quality')),
                'format_note': str_or_none(fmt.get('label')),
                'ext': str_or_none(fmt.get('type')),
                'width': int_or_none(fmt.get('width')),
                'height': int_or_none(fmt.get('height')),
            })
        self._sort_formats(formats)

        # Title preference: embedded metadata, then <meta> tags, then <title>
        # with the ' | GoPro' suffix removed.
        title = str_or_none(
            try_get(metadata, lambda x: x['collection']['title'])
            or self._html_search_meta(['og:title', 'twitter:title'], webpage)
            or remove_end(self._html_search_regex(
                r'<title[^>]*>([^<]+)</title>', webpage, 'title', fatal=False), ' | GoPro'))
        if title:
            # Collapse multi-line titles onto a single line.
            title = title.replace('\n', ' ')

        return {
            'id': video_id,
            'title': title,
            'formats': formats,
            'thumbnail': url_or_none(
                self._html_search_meta(['og:image', 'twitter:image'], webpage)),
            'timestamp': unified_timestamp(
                try_get(metadata, lambda x: x['collection']['created_at'])),
            'uploader_id': str_or_none(
                try_get(metadata, lambda x: x['account']['nickname'])),
            # NOTE(review): the expected test values (e.g. 396062) look like
            # milliseconds rather than seconds - confirm the unit of
            # 'source_duration' before rescaling.
            'duration': int_or_none(
                video_info.get('source_duration')),
            'artist': str_or_none(
                video_info.get('music_track_artist')),
            'track': str_or_none(
                video_info.get('music_track_name')),
        }
Loading…
Cancel
Save