aboutsummaryrefslogtreecommitdiffstats
path: root/hypervideo_dl/extractor/medaltv.py
diff options
context:
space:
mode:
Diffstat (limited to 'hypervideo_dl/extractor/medaltv.py')
-rw-r--r--hypervideo_dl/extractor/medaltv.py77
1 files changed, 56 insertions, 21 deletions
diff --git a/hypervideo_dl/extractor/medaltv.py b/hypervideo_dl/extractor/medaltv.py
index 59cc307..82be823 100644
--- a/hypervideo_dl/extractor/medaltv.py
+++ b/hypervideo_dl/extractor/medaltv.py
@@ -1,6 +1,3 @@
-# coding: utf-8
-from __future__ import unicode_literals
-
import re
from .common import InfoExtractor
@@ -11,15 +8,33 @@ from ..utils import (
float_or_none,
int_or_none,
str_or_none,
- try_get,
+ traverse_obj,
)
class MedalTVIE(InfoExtractor):
- _VALID_URL = r'https?://(?:www\.)?medal\.tv/clips/(?P<id>[^/?#&]+)'
+ _VALID_URL = r'https?://(?:www\.)?medal\.tv/(?P<path>games/[^/?#&]+/clips)/(?P<id>[^/?#&]+)'
_TESTS = [{
- 'url': 'https://medal.tv/clips/2mA60jWAGQCBH',
- 'md5': '7b07b064331b1cf9e8e5c52a06ae68fa',
+ 'url': 'https://medal.tv/games/valorant/clips/jTBFnLKdLy15K',
+ 'md5': '6930f8972914b6b9fdc2bb3918098ba0',
+ 'info_dict': {
+ 'id': 'jTBFnLKdLy15K',
+ 'ext': 'mp4',
+ 'title': "Mornu's clutch",
+ 'description': '',
+ 'uploader': 'Aciel',
+ 'timestamp': 1651628243,
+ 'upload_date': '20220504',
+ 'uploader_id': '19335460',
+ 'uploader_url': 'https://medal.tv/users/19335460',
+ 'comment_count': int,
+ 'view_count': int,
+ 'like_count': int,
+ 'duration': 13,
+ }
+ }, {
+ 'url': 'https://medal.tv/games/cod%20cold%20war/clips/2mA60jWAGQCBH',
+ 'md5': '3d19d426fe0b2d91c26e412684e66a06',
'info_dict': {
'id': '2mA60jWAGQCBH',
'ext': 'mp4',
@@ -29,9 +44,15 @@ class MedalTVIE(InfoExtractor):
'timestamp': 1603165266,
'upload_date': '20201020',
'uploader_id': '10619174',
+ 'thumbnail': 'https://cdn.medal.tv/10619174/thumbnail-34934644-720p.jpg?t=1080p&c=202042&missing',
+ 'uploader_url': 'https://medal.tv/users/10619174',
+ 'comment_count': int,
+ 'view_count': int,
+ 'like_count': int,
+ 'duration': 23,
}
}, {
- 'url': 'https://medal.tv/clips/2um24TWdty0NA',
+ 'url': 'https://medal.tv/games/cod%20cold%20war/clips/2um24TWdty0NA',
'md5': 'b6dc76b78195fff0b4f8bf4a33ec2148',
'info_dict': {
'id': '2um24TWdty0NA',
@@ -42,25 +63,42 @@ class MedalTVIE(InfoExtractor):
'timestamp': 1605580939,
'upload_date': '20201117',
'uploader_id': '5156321',
+ 'thumbnail': 'https://cdn.medal.tv/5156321/thumbnail-36787208-360p.jpg?t=1080p&c=202046&missing',
+ 'uploader_url': 'https://medal.tv/users/5156321',
+ 'comment_count': int,
+ 'view_count': int,
+ 'like_count': int,
+ 'duration': 9,
}
}, {
- 'url': 'https://medal.tv/clips/37rMeFpryCC-9',
+ 'url': 'https://medal.tv/games/valorant/clips/37rMeFpryCC-9',
'only_matching': True,
}, {
- 'url': 'https://medal.tv/clips/2WRj40tpY_EU9',
+ 'url': 'https://medal.tv/games/valorant/clips/2WRj40tpY_EU9',
'only_matching': True,
}]
def _real_extract(self, url):
video_id = self._match_id(url)
+ path = self._match_valid_url(url).group('path')
+
webpage = self._download_webpage(url, video_id)
- hydration_data = self._parse_json(self._search_regex(
- r'<script[^>]*>\s*(?:var\s*)?hydrationData\s*=\s*({.+?})\s*</script>',
- webpage, 'hydration data', default='{}'), video_id)
+ next_data = self._search_json(
+ '<script[^>]*__NEXT_DATA__[^>]*>', webpage,
+ 'next data', video_id, end_pattern='</script>', fatal=False)
- clip = try_get(
- hydration_data, lambda x: x['clips'][video_id], dict) or {}
+ build_id = next_data.get('buildId')
+ if not build_id:
+ raise ExtractorError(
+ 'Could not find build ID.', video_id=video_id)
+
+ locale = next_data.get('locale', 'en')
+
+ api_response = self._download_json(
+ f'https://medal.tv/_next/data/{build_id}/{locale}/{path}/{video_id}.json', video_id)
+
+ clip = traverse_obj(api_response, ('pageProps', 'clip')) or {}
if not clip:
raise ExtractorError(
'Could not find video information.', video_id=video_id)
@@ -112,14 +150,11 @@ class MedalTVIE(InfoExtractor):
'An unknown error occurred ({0}).'.format(error),
video_id=video_id)
- self._sort_formats(formats)
-
# Necessary because the id of the author is not known in advance.
# Won't raise an issue if no profile can be found as this is optional.
- author = try_get(
- hydration_data, lambda x: list(x['profiles'].values())[0], dict) or {}
- author_id = str_or_none(author.get('id'))
- author_url = format_field(author_id, template='https://medal.tv/users/%s')
+ author = traverse_obj(api_response, ('pageProps', 'profile')) or {}
+ author_id = str_or_none(author.get('userId'))
+ author_url = format_field(author_id, None, 'https://medal.tv/users/%s')
return {
'id': video_id,