diff options
Diffstat (limited to 'youtube_dl/extractor/srgssr.py')
-rw-r--r-- | youtube_dl/extractor/srgssr.py | 252 |
1 files changed, 0 insertions, 252 deletions
diff --git a/youtube_dl/extractor/srgssr.py b/youtube_dl/extractor/srgssr.py deleted file mode 100644 index ac018e740..000000000 --- a/youtube_dl/extractor/srgssr.py +++ /dev/null @@ -1,252 +0,0 @@ -# coding: utf-8 -from __future__ import unicode_literals - -import re - -from .common import InfoExtractor -from ..utils import ( - ExtractorError, - float_or_none, - int_or_none, - parse_iso8601, - qualities, - try_get, -) - - -class SRGSSRIE(InfoExtractor): - _VALID_URL = r'''(?x) - (?: - https?://tp\.srgssr\.ch/p(?:/[^/]+)+\?urn=urn| - srgssr - ): - (?P<bu> - srf|rts|rsi|rtr|swi - ):(?:[^:]+:)? - (?P<type> - video|audio - ): - (?P<id> - [0-9a-f\-]{36}|\d+ - ) - ''' - _GEO_BYPASS = False - _GEO_COUNTRIES = ['CH'] - - _ERRORS = { - 'AGERATING12': 'To protect children under the age of 12, this video is only available between 8 p.m. and 6 a.m.', - 'AGERATING18': 'To protect children under the age of 18, this video is only available between 11 p.m. and 5 a.m.', - # 'ENDDATE': 'For legal reasons, this video was only available for a specified period of time.', - 'GEOBLOCK': 'For legal reasons, this video is only available in Switzerland.', - 'LEGAL': 'The video cannot be transmitted for legal reasons.', - 'STARTDATE': 'This video is not yet available. Please try again later.', - } - _DEFAULT_LANGUAGE_CODES = { - 'srf': 'de', - 'rts': 'fr', - 'rsi': 'it', - 'rtr': 'rm', - 'swi': 'en', - } - - def _get_tokenized_src(self, url, video_id, format_id): - token = self._download_json( - 'http://tp.srgssr.ch/akahd/token?acl=*', - video_id, 'Downloading %s token' % format_id, fatal=False) or {} - auth_params = try_get(token, lambda x: x['token']['authparams']) - if auth_params: - url += ('?' if '?' not in url else '&') + auth_params - return url - - def _get_media_data(self, bu, media_type, media_id): - query = {'onlyChapters': True} if media_type == 'video' else {} - full_media_data = self._download_json( - 'https://il.srgssr.ch/integrationlayer/2.0/%s/mediaComposition/%s/%s.json' - % (bu, media_type, media_id), - media_id, query=query)['chapterList'] - try: - media_data = next( - x for x in full_media_data if x.get('id') == media_id) - except StopIteration: - raise ExtractorError('No media information found') - - block_reason = media_data.get('blockReason') - if block_reason and block_reason in self._ERRORS: - message = self._ERRORS[block_reason] - if block_reason == 'GEOBLOCK': - self.raise_geo_restricted( - msg=message, countries=self._GEO_COUNTRIES) - raise ExtractorError( - '%s said: %s' % (self.IE_NAME, message), expected=True) - - return media_data - - def _real_extract(self, url): - bu, media_type, media_id = re.match(self._VALID_URL, url).groups() - media_data = self._get_media_data(bu, media_type, media_id) - title = media_data['title'] - - formats = [] - q = qualities(['SD', 'HD']) - for source in (media_data.get('resourceList') or []): - format_url = source.get('url') - if not format_url: - continue - protocol = source.get('protocol') - quality = source.get('quality') - format_id = [] - for e in (protocol, source.get('encoding'), quality): - if e: - format_id.append(e) - format_id = '-'.join(format_id) - - if protocol in ('HDS', 'HLS'): - if source.get('tokenType') == 'AKAMAI': - format_url = self._get_tokenized_src( - format_url, media_id, format_id) - formats.extend(self._extract_akamai_formats( - format_url, media_id)) - elif protocol == 'HLS': - formats.extend(self._extract_m3u8_formats( - format_url, media_id, 'mp4', 'm3u8_native', - m3u8_id=format_id, fatal=False)) - elif protocol in ('HTTP', 'HTTPS'): - formats.append({ - 'format_id': format_id, - 'url': format_url, - 'quality': q(quality), - }) - - # This is needed because for audio medias the podcast url is usually - # always included, even if is only an audio segment and not the - # whole episode. - if int_or_none(media_data.get('position')) == 0: - for p in ('S', 'H'): - podcast_url = media_data.get('podcast%sdUrl' % p) - if not podcast_url: - continue - quality = p + 'D' - formats.append({ - 'format_id': 'PODCAST-' + quality, - 'url': podcast_url, - 'quality': q(quality), - }) - self._sort_formats(formats) - - subtitles = {} - if media_type == 'video': - for sub in (media_data.get('subtitleList') or []): - sub_url = sub.get('url') - if not sub_url: - continue - lang = sub.get('locale') or self._DEFAULT_LANGUAGE_CODES[bu] - subtitles.setdefault(lang, []).append({ - 'url': sub_url, - }) - - return { - 'id': media_id, - 'title': title, - 'description': media_data.get('description'), - 'timestamp': parse_iso8601(media_data.get('date')), - 'thumbnail': media_data.get('imageUrl'), - 'duration': float_or_none(media_data.get('duration'), 1000), - 'subtitles': subtitles, - 'formats': formats, - } - - -class SRGSSRPlayIE(InfoExtractor): - IE_DESC = 'srf.ch, rts.ch, rsi.ch, rtr.ch and swissinfo.ch play sites' - _VALID_URL = r'''(?x) - https?:// - (?:(?:www|play)\.)? - (?P<bu>srf|rts|rsi|rtr|swissinfo)\.ch/play/(?:tv|radio)/ - (?: - [^/]+/(?P<type>video|audio)/[^?]+| - popup(?P<type_2>video|audio)player - ) - \?.*?\b(?:id=|urn=urn:[^:]+:video:)(?P<id>[0-9a-f\-]{36}|\d+) - ''' - - _TESTS = [{ - 'url': 'http://www.srf.ch/play/tv/10vor10/video/snowden-beantragt-asyl-in-russland?id=28e1a57d-5b76-4399-8ab3-9097f071e6c5', - 'md5': '6db2226ba97f62ad42ce09783680046c', - 'info_dict': { - 'id': '28e1a57d-5b76-4399-8ab3-9097f071e6c5', - 'ext': 'mp4', - 'upload_date': '20130701', - 'title': 'Snowden beantragt Asyl in Russland', - 'timestamp': 1372708215, - 'duration': 113.827, - 'thumbnail': r're:^https?://.*1383719781\.png$', - }, - 'expected_warnings': ['Unable to download f4m manifest'], - }, { - 'url': 'http://www.rtr.ch/play/radio/actualitad/audio/saira-tujetsch-tuttina-cuntinuar-cun-sedrun-muster-turissem?id=63cb0778-27f8-49af-9284-8c7a8c6d15fc', - 'info_dict': { - 'id': '63cb0778-27f8-49af-9284-8c7a8c6d15fc', - 'ext': 'mp3', - 'upload_date': '20151013', - 'title': 'Saira: Tujetsch - tuttina cuntinuar cun Sedrun Mustér Turissem', - 'timestamp': 1444709160, - 'duration': 336.816, - }, - 'params': { - # rtmp download - 'skip_download': True, - }, - }, { - 'url': 'http://www.rts.ch/play/tv/-/video/le-19h30?id=6348260', - 'md5': '67a2a9ae4e8e62a68d0e9820cc9782df', - 'info_dict': { - 'id': '6348260', - 'display_id': '6348260', - 'ext': 'mp4', - 'duration': 1796.76, - 'title': 'Le 19h30', - 'upload_date': '20141201', - 'timestamp': 1417458600, - 'thumbnail': r're:^https?://.*\.image', - }, - 'params': { - # m3u8 download - 'skip_download': True, - } - }, { - 'url': 'http://play.swissinfo.ch/play/tv/business/video/why-people-were-against-tax-reforms?id=42960270', - 'info_dict': { - 'id': '42960270', - 'ext': 'mp4', - 'title': 'Why people were against tax reforms', - 'description': 'md5:7ac442c558e9630e947427469c4b824d', - 'duration': 94.0, - 'upload_date': '20170215', - 'timestamp': 1487173560, - 'thumbnail': r're:https?://www\.swissinfo\.ch/srgscalableimage/42961964', - 'subtitles': 'count:9', - }, - 'params': { - 'skip_download': True, - } - }, { - 'url': 'https://www.srf.ch/play/tv/popupvideoplayer?id=c4dba0ca-e75b-43b2-a34f-f708a4932e01', - 'only_matching': True, - }, { - 'url': 'https://www.srf.ch/play/tv/10vor10/video/snowden-beantragt-asyl-in-russland?urn=urn:srf:video:28e1a57d-5b76-4399-8ab3-9097f071e6c5', - 'only_matching': True, - }, { - 'url': 'https://www.rts.ch/play/tv/19h30/video/le-19h30?urn=urn:rts:video:6348260', - 'only_matching': True, - }, { - # audio segment, has podcastSdUrl of the full episode - 'url': 'https://www.srf.ch/play/radio/popupaudioplayer?id=50b20dc8-f05b-4972-bf03-e438ff2833eb', - 'only_matching': True, - }] - - def _real_extract(self, url): - mobj = re.match(self._VALID_URL, url) - bu = mobj.group('bu') - media_type = mobj.group('type') or mobj.group('type_2') - media_id = mobj.group('id') - return self.url_result('srgssr:%s:%s:%s' % (bu[:3], media_type, media_id), 'SRGSSR') |