diff options
author | Jesús <heckyel@hyperbola.info> | 2021-10-18 15:24:21 -0500 |
---|---|---|
committer | Jesús <heckyel@hyperbola.info> | 2021-10-18 15:24:21 -0500 |
commit | 5122028a4bcac4ae577ef7fbd55ccad5cb34ef5e (patch) | |
tree | 65209bc739db35e31f1c9b5b868eb5df4fe12ae3 /hypervideo_dl/extractor/mildom.py | |
parent | 27fe903c511691c078942bef5ee9a05a43b15c8f (diff) | |
download | hypervideo-5122028a4bcac4ae577ef7fbd55ccad5cb34ef5e.tar.lz hypervideo-5122028a4bcac4ae577ef7fbd55ccad5cb34ef5e.tar.xz hypervideo-5122028a4bcac4ae577ef7fbd55ccad5cb34ef5e.zip |
update from upstream
Diffstat (limited to 'hypervideo_dl/extractor/mildom.py')
-rw-r--r-- | hypervideo_dl/extractor/mildom.py | 258 |
1 files changed, 258 insertions, 0 deletions
diff --git a/hypervideo_dl/extractor/mildom.py b/hypervideo_dl/extractor/mildom.py new file mode 100644 index 0000000..c147cbb --- /dev/null +++ b/hypervideo_dl/extractor/mildom.py @@ -0,0 +1,258 @@ +# coding: utf-8 +from __future__ import unicode_literals + +import base64 +from datetime import datetime +import itertools +import json + +from .common import InfoExtractor +from ..utils import ( + std_headers, + update_url_query, + random_uuidv4, + try_get, +) +from ..compat import ( + compat_str, +) + + +class MildomBaseIE(InfoExtractor): + _GUEST_ID = None + _DISPATCHER_CONFIG = None + + def _call_api(self, url, video_id, query={}, note='Downloading JSON metadata', init=False): + url = update_url_query(url, self._common_queries(query, init=init)) + return self._download_json(url, video_id, note=note)['body'] + + def _common_queries(self, query={}, init=False): + dc = self._fetch_dispatcher_config() + r = { + 'timestamp': self.iso_timestamp(), + '__guest_id': '' if init else self.guest_id(), + '__location': dc['location'], + '__country': dc['country'], + '__cluster': dc['cluster'], + '__platform': 'web', + '__la': self.lang_code(), + '__pcv': 'v2.9.44', + 'sfr': 'pc', + 'accessToken': '', + } + r.update(query) + return r + + def _fetch_dispatcher_config(self): + if not self._DISPATCHER_CONFIG: + tmp = self._download_json( + 'https://disp.mildom.com/serverListV2', 'initialization', + note='Downloading dispatcher_config', data=json.dumps({ + 'protover': 0, + 'data': base64.b64encode(json.dumps({ + 'fr': 'web', + 'sfr': 'pc', + 'devi': 'Windows', + 'la': 'ja', + 'gid': None, + 'loc': '', + 'clu': '', + 'wh': '1919*810', + 'rtm': self.iso_timestamp(), + 'ua': std_headers['User-Agent'], + }).encode('utf8')).decode('utf8').replace('\n', ''), + }).encode('utf8')) + self._DISPATCHER_CONFIG = self._parse_json(base64.b64decode(tmp['data']), 'initialization') + return self._DISPATCHER_CONFIG + + @staticmethod + def iso_timestamp(): + 'new Date().toISOString()' + return datetime.utcnow().isoformat()[0:-3] + 'Z' + + def guest_id(self): + 'getGuestId' + if self._GUEST_ID: + return self._GUEST_ID + self._GUEST_ID = try_get( + self, ( + lambda x: x._call_api( + 'https://cloudac.mildom.com/nonolive/gappserv/guest/h5init', 'initialization', + note='Downloading guest token', init=True)['guest_id'] or None, + lambda x: x._get_cookies('https://www.mildom.com').get('gid').value, + lambda x: x._get_cookies('https://m.mildom.com').get('gid').value, + ), compat_str) or '' + return self._GUEST_ID + + def lang_code(self): + 'getCurrentLangCode' + return 'ja' + + +class MildomIE(MildomBaseIE): + IE_NAME = 'mildom' + IE_DESC = 'Record ongoing live by specific user in Mildom' + _VALID_URL = r'https?://(?:(?:www|m)\.)mildom\.com/(?P<id>\d+)' + + def _real_extract(self, url): + video_id = self._match_id(url) + url = 'https://www.mildom.com/%s' % video_id + + webpage = self._download_webpage(url, video_id) + + enterstudio = self._call_api( + 'https://cloudac.mildom.com/nonolive/gappserv/live/enterstudio', video_id, + note='Downloading live metadata', query={'user_id': video_id}) + result_video_id = enterstudio.get('log_id', video_id) + + title = try_get( + enterstudio, ( + lambda x: self._html_search_meta('twitter:description', webpage), + lambda x: x['anchor_intro'], + ), compat_str) + description = try_get( + enterstudio, ( + lambda x: x['intro'], + lambda x: x['live_intro'], + ), compat_str) + uploader = try_get( + enterstudio, ( + lambda x: self._html_search_meta('twitter:title', webpage), + lambda x: x['loginname'], + ), compat_str) + + servers = self._call_api( + 'https://cloudac.mildom.com/nonolive/gappserv/live/liveserver', result_video_id, + note='Downloading live server list', query={ + 'user_id': video_id, + 'live_server_type': 'hls', + }) + + stream_query = self._common_queries({ + 'streamReqId': random_uuidv4(), + 'is_lhls': '0', + }) + m3u8_url = update_url_query(servers['stream_server'] + '/%s_master.m3u8' % video_id, stream_query) + formats = self._extract_m3u8_formats(m3u8_url, result_video_id, 'mp4', headers={ + 'Referer': 'https://www.mildom.com/', + 'Origin': 'https://www.mildom.com', + }, note='Downloading m3u8 information') + + del stream_query['streamReqId'], stream_query['timestamp'] + for fmt in formats: + fmt.setdefault('http_headers', {})['Referer'] = 'https://www.mildom.com/' + + self._sort_formats(formats) + + return { + 'id': result_video_id, + 'title': title, + 'description': description, + 'uploader': uploader, + 'uploader_id': video_id, + 'formats': formats, + 'is_live': True, + } + + +class MildomVodIE(MildomBaseIE): + IE_NAME = 'mildom:vod' + IE_DESC = 'Download a VOD in Mildom' + _VALID_URL = r'https?://(?:(?:www|m)\.)mildom\.com/playback/(?P<user_id>\d+)/(?P<id>(?P=user_id)-[a-zA-Z0-9]+)' + + def _real_extract(self, url): + m = self._match_valid_url(url) + user_id, video_id = m.group('user_id'), m.group('id') + url = 'https://www.mildom.com/playback/%s/%s' % (user_id, video_id) + + webpage = self._download_webpage(url, video_id) + + autoplay = self._call_api( + 'https://cloudac.mildom.com/nonolive/videocontent/playback/getPlaybackDetail', video_id, + note='Downloading playback metadata', query={ + 'v_id': video_id, + })['playback'] + + title = try_get( + autoplay, ( + lambda x: self._html_search_meta('og:description', webpage), + lambda x: x['title'], + ), compat_str) + description = try_get( + autoplay, ( + lambda x: x['video_intro'], + ), compat_str) + uploader = try_get( + autoplay, ( + lambda x: x['author_info']['login_name'], + ), compat_str) + + formats = [{ + 'url': autoplay['audio_url'], + 'format_id': 'audio', + 'protocol': 'm3u8_native', + 'vcodec': 'none', + 'acodec': 'aac', + 'ext': 'm4a' + }] + for fmt in autoplay['video_link']: + formats.append({ + 'format_id': 'video-%s' % fmt['name'], + 'url': fmt['url'], + 'protocol': 'm3u8_native', + 'width': fmt['level'] * autoplay['video_width'] // autoplay['video_height'], + 'height': fmt['level'], + 'vcodec': 'h264', + 'acodec': 'aac', + 'ext': 'mp4' + }) + + self._sort_formats(formats) + + return { + 'id': video_id, + 'title': title, + 'description': description, + 'uploader': uploader, + 'uploader_id': user_id, + 'formats': formats, + } + + +class MildomUserVodIE(MildomBaseIE): + IE_NAME = 'mildom:user:vod' + IE_DESC = 'Download all VODs from specific user in Mildom' + _VALID_URL = r'https?://(?:(?:www|m)\.)mildom\.com/profile/(?P<id>\d+)' + _TESTS = [{ + 'url': 'https://www.mildom.com/profile/10093333', + 'info_dict': { + 'id': '10093333', + 'title': 'Uploads from ねこばたけ', + }, + 'playlist_mincount': 351, + }] + + def _entries(self, user_id): + for page in itertools.count(1): + reply = self._call_api( + 'https://cloudac.mildom.com/nonolive/videocontent/profile/playbackList', + user_id, note='Downloading page %d' % page, query={ + 'user_id': user_id, + 'page': page, + 'limit': '30', + }) + if not reply: + break + for x in reply: + yield self.url_result('https://www.mildom.com/playback/%s/%s' % (user_id, x['v_id'])) + + def _real_extract(self, url): + user_id = self._match_id(url) + self.to_screen('This will download all VODs belonging to user. To download ongoing live video, use "https://www.mildom.com/%s" instead' % user_id) + + profile = self._call_api( + 'https://cloudac.mildom.com/nonolive/gappserv/user/profileV2', user_id, + query={'user_id': user_id}, note='Downloading user profile')['user_info'] + + return self.playlist_result( + self._entries(user_id), user_id, 'Uploads from %s' % profile['loginname']) |