diff options
| author | HobbyistDev <105957301+HobbyistDev@users.noreply.github.com> | 2023-02-17 11:57:52 +0900 | 
|---|---|---|
| committer | GitHub <noreply@github.com> | 2023-02-17 08:27:52 +0530 | 
| commit | 72671a212d7c939329cb5d34335fa089dd3acbd3 (patch) | |
| tree | 9cffded4eeb2c8ffa8645b9efe82ca385edafe9d | |
| parent | 376aa24b1541e2bfb23337c0ae9bafa5bb3787f1 (diff) | |
| download | hypervideo-pre-72671a212d7c939329cb5d34335fa089dd3acbd3.tar.lz hypervideo-pre-72671a212d7c939329cb5d34335fa089dd3acbd3.tar.xz hypervideo-pre-72671a212d7c939329cb5d34335fa089dd3acbd3.zip | |
[extractor/viu] Add `ViuOTTIndonesiaIE` extractor (#6099)
Authored by: HobbyistDev
Closes #1757
| -rw-r--r-- | yt_dlp/extractor/_extractors.py | 1 | ||||
| -rw-r--r-- | yt_dlp/extractor/viu.py | 146 | 
2 files changed, 147 insertions, 0 deletions
| diff --git a/yt_dlp/extractor/_extractors.py b/yt_dlp/extractor/_extractors.py index 061a25a4e..081696855 100644 --- a/yt_dlp/extractor/_extractors.py +++ b/yt_dlp/extractor/_extractors.py @@ -2181,6 +2181,7 @@ from .viu import (      ViuIE,      ViuPlaylistIE,      ViuOTTIE, +    ViuOTTIndonesiaIE,  )  from .vk import (      VKIE, diff --git a/yt_dlp/extractor/viu.py b/yt_dlp/extractor/viu.py index dd4cad7ba..6f9af9f64 100644 --- a/yt_dlp/extractor/viu.py +++ b/yt_dlp/extractor/viu.py @@ -9,9 +9,12 @@ from ..compat import compat_str  from ..utils import (      ExtractorError,      int_or_none, +    remove_end,      strip_or_none, +    traverse_obj,      try_get,      smuggle_url, +    unified_timestamp,      unsmuggle_url,      url_or_none,  ) @@ -394,3 +397,146 @@ class ViuOTTIE(InfoExtractor):              'formats': formats,              'subtitles': subtitles,          } + + +class ViuOTTIndonesiaBaseIE(InfoExtractor): +    _BASE_QUERY = { +        'ver': 1.0, +        'fmt': 'json', +        'aver': 5.0, +        'appver': 2.0, +        'appid': 'viu_desktop', +        'platform': 'desktop', +    } + +    _DEVICE_ID = str(uuid.uuid4()) +    _SESSION_ID = str(uuid.uuid4()) +    _TOKEN = None + +    _HEADERS = { +        'x-session-id': _SESSION_ID, +        'x-client': 'browser' +    } + +    _AGE_RATINGS_MAPPER = { +        'ADULTS': 18, +        'teens': 13 +    } + +    def _real_initialize(self): +        ViuOTTIndonesiaBaseIE._TOKEN = self._download_json( +            'https://um.viuapi.io/user/identity', None, +            headers={'Content-type': 'application/json', **self._HEADERS}, +            query={**self._BASE_QUERY, 'iid': self._DEVICE_ID}, +            data=json.dumps({'deviceId': self._DEVICE_ID}).encode(), +            note='Downloading token information')['token'] + + +class ViuOTTIndonesiaIE(ViuOTTIndonesiaBaseIE): +    _VALID_URL = r'https?://www\.viu\.com/ott/\w+/\w+/all/video-[\w-]+-(?P<id>\d+)' +    _TESTS = [{ +        'url': 'https://www.viu.com/ott/id/id/all/video-japanese-drama-tv_shows-detective_conan_episode_793-1165863142?containerId=playlist-26271226', +        'info_dict': { +            'id': '1165863142', +            'ext': 'mp4', +            'episode_number': 793, +            'episode': 'Episode 793', +            'title': 'Detective Conan - Episode 793', +            'duration': 1476, +            'description': 'md5:b79d55345bc1e0217ece22616267c9a5', +            'thumbnail': 'https://vuclipi-a.akamaihd.net/p/cloudinary/h_171,w_304,dpr_1.5,f_auto,c_thumb,q_auto:low/1165863189/d-1', +            'upload_date': '20210101', +            'timestamp': 1609459200, +        } +    }, { +        'url': 'https://www.viu.com/ott/id/id/all/video-korean-reality-tv_shows-entertainment_weekly_episode_1622-1118617054', +        'info_dict': { +            'id': '1118617054', +            'ext': 'mp4', +            'episode_number': 1622, +            'episode': 'Episode 1622', +            'description': 'md5:6d68ca450004020113e9bf27ad99f0f8', +            'title': 'Entertainment Weekly - Episode 1622', +            'duration': 4729, +            'thumbnail': 'https://vuclipi-a.akamaihd.net/p/cloudinary/h_171,w_304,dpr_1.5,f_auto,c_thumb,q_auto:low/1120187848/d-1', +            'timestamp': 1420070400, +            'upload_date': '20150101', +            'cast': ['Shin Hyun-joon', 'Lee Da-Hee'] +        } +    }, { +        # age-limit test +        'url': 'https://www.viu.com/ott/id/id/all/video-japanese-trailer-tv_shows-trailer_jujutsu_kaisen_ver_01-1166044219?containerId=playlist-26273140', +        'info_dict': { +            'id': '1166044219', +            'ext': 'mp4', +            'upload_date': '20200101', +            'timestamp': 1577836800, +            'title': 'Trailer \'Jujutsu Kaisen\' Ver.01', +            'duration': 92, +            'thumbnail': 'https://vuclipi-a.akamaihd.net/p/cloudinary/h_171,w_304,dpr_1.5,f_auto,c_thumb,q_auto:low/1166044240/d-1', +            'description': 'Trailer \'Jujutsu Kaisen\' Ver.01', +            'cast': ['Junya Enoki', ' Yƻichi Nakamura', ' Yuma Uchida', 'Asami Seto'], +            'age_limit': 13, +        } +    }, { +        # json ld metadata type equal to Movie instead of TVEpisodes +        'url': 'https://www.viu.com/ott/id/id/all/video-japanese-animation-movies-demon_slayer_kimetsu_no_yaiba_the_movie_mugen_train-1165892707?containerId=1675060691786', +        'info_dict': { +            'id': '1165892707', +            'ext': 'mp4', +            'timestamp': 1577836800, +            'upload_date': '20200101', +            'title': 'Demon Slayer - Kimetsu no Yaiba - The Movie: Mugen Train', +            'age_limit': 13, +            'cast': 'count:9', +            'thumbnail': 'https://vuclipi-a.akamaihd.net/p/cloudinary/h_171,w_304,dpr_1.5,f_auto,c_thumb,q_auto:low/1165895279/d-1', +            'description': 'md5:1ce9c35a3aeab384085533f746c87469', +            'duration': 7021, +        } +    }] + +    def _real_extract(self, url): +        display_id = self._match_id(url) +        webpage = self._download_webpage(url, display_id) + +        video_data = self._download_json( +            f'https://um.viuapi.io/drm/v1/content/{display_id}', display_id, data=b'', +            headers={'Authorization': ViuOTTIndonesiaBaseIE._TOKEN, **self._HEADERS, 'ccode': 'ID'}) +        formats, subtitles = self._extract_m3u8_formats_and_subtitles(video_data['playUrl'], display_id) + +        initial_state = self._search_json( +            r'window\.__INITIAL_STATE__\s*=', webpage, 'initial state', +            display_id)['content']['clipDetails'] +        for key, url in initial_state.items(): +            lang, ext = self._search_regex( +                r'^subtitle_(?P<lang>[\w-]+)_(?P<ext>\w+)$', key, 'subtitle metadata', +                default=(None, None), group=('lang', 'ext')) +            if lang and ext: +                subtitles.setdefault(lang, []).append({ +                    'ext': ext, +                    'url': url, +                }) + +                if ext == 'vtt': +                    subtitles[lang].append({ +                        'ext': 'srt', +                        'url': f'{remove_end(initial_state[key], "vtt")}srt', +                    }) + +        episode = traverse_obj(list(filter( +            lambda x: x.get('@type') in ('TVEpisode', 'Movie'), self._yield_json_ld(webpage, display_id))), 0) or {} +        return { +            'id': display_id, +            'title': (traverse_obj(initial_state, 'title', 'display_title') +                      or episode.get('name')), +            'description': initial_state.get('description') or episode.get('description'), +            'duration': initial_state.get('duration'), +            'thumbnail': traverse_obj(episode, ('image', 'url')), +            'timestamp': unified_timestamp(episode.get('dateCreated')), +            'formats': formats, +            'subtitles': subtitles, +            'episode_number': (traverse_obj(initial_state, 'episode_no', 'episodeno', expected_type=int_or_none) +                               or int_or_none(episode.get('episodeNumber'))), +            'cast': traverse_obj(episode, ('actor', ..., 'name'), default=None), +            'age_limit': self._AGE_RATINGS_MAPPER.get(initial_state.get('internal_age_rating')) +        } | 
