diff options
author | Grabien <60237587+Grabien@users.noreply.github.com> | 2021-11-26 21:00:04 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2021-11-27 00:30:04 +0530 |
commit | 18d6dd4e0194211c4f3238fe441ebe0c1fdbc167 (patch) | |
tree | 1448627be1eda3681f57c7f02c43977d81d45e5b | |
parent | 883ecd54949fa90174094628bf002f179edf6767 (diff) | |
download | hypervideo-pre-18d6dd4e0194211c4f3238fe441ebe0c1fdbc167.tar.lz hypervideo-pre-18d6dd4e0194211c4f3238fe441ebe0c1fdbc167.tar.xz hypervideo-pre-18d6dd4e0194211c4f3238fe441ebe0c1fdbc167.zip |
[extractor/breitbart] Breitbart.com website support (#1434)
Authored by: Grabien
-rw-r--r-- | yt_dlp/extractor/breitbart.py | 39 | ||||
-rw-r--r-- | yt_dlp/extractor/extractors.py | 1 |
2 files changed, 40 insertions, 0 deletions
diff --git a/yt_dlp/extractor/breitbart.py b/yt_dlp/extractor/breitbart.py new file mode 100644 index 000000000..f50f719dc --- /dev/null +++ b/yt_dlp/extractor/breitbart.py @@ -0,0 +1,39 @@ +from __future__ import unicode_literals + +from .common import InfoExtractor + + +class BreitBartIE(InfoExtractor): + _VALID_URL = r'https?:\/\/(?:www\.)breitbart.com/videos/v/(?P<id>[^/]+)' + _TESTS = [{ + 'url': 'https://www.breitbart.com/videos/v/5cOz1yup/?pl=Ij6NDOji', + 'md5': '0aa6d1d6e183ac5ca09207fe49f17ade', + 'info_dict': { + 'id': '5cOz1yup', + 'ext': 'mp4', + 'title': 'Watch \u2013 Clyburn: Statues in Congress Have to Go Because they Are Honoring Slavery', + 'description': 'md5:bac35eb0256d1cb17f517f54c79404d5', + 'thumbnail': 'https://cdn.jwplayer.com/thumbs/5cOz1yup-1920.jpg', + 'age_limit': 0, + } + }, { + 'url': 'https://www.breitbart.com/videos/v/eaiZjVOn/', + 'only_matching': True, + }] + + def _real_extract(self, url): + video_id = self._match_id(url) + webpage = self._download_webpage(url, video_id) + + formats = self._extract_m3u8_formats(f'https://cdn.jwplayer.com/manifests/{video_id}.m3u8', video_id, ext='mp4') + self._sort_formats(formats) + return { + 'id': video_id, + 'title': self._og_search_title( + webpage, default=None) or self._html_search_regex( + r'(?s)<title>(.*?)</title>', webpage, 'video title'), + 'description': self._og_search_description(webpage), + 'thumbnail': self._og_search_thumbnail(webpage), + 'age_limit': self._rta_search(webpage), + 'formats': formats + } diff --git a/yt_dlp/extractor/extractors.py b/yt_dlp/extractor/extractors.py index 163efc748..ed8a23e72 100644 --- a/yt_dlp/extractor/extractors.py +++ b/yt_dlp/extractor/extractors.py @@ -179,6 +179,7 @@ from .br import ( ) from .bravotv import BravoTVIE from .breakcom import BreakIE +from .breitbart import BreitBartIE from .brightcove import ( BrightcoveLegacyIE, BrightcoveNewIE, |