about summary refs log tree commit diff stats
path: root/hypervideo_dl/extractor/telegram.py
diff options
context:
space:
mode:
author Jesús <heckyel@hyperbola.info> 2022-04-06 03:37:17 +0800
committer Jesús <heckyel@hyperbola.info> 2022-04-06 03:37:17 +0800
commit 1e5a50b71d8f0eae6007bedc329eecb24bb5aba3 (patch)
tree a8611cda6596391cb6fb645e1469dcd356b63924 /hypervideo_dl/extractor/telegram.py
parent f52fb3bceeb9d22b5106c1796fecec474a0cc138 (diff)
download hypervideo-1e5a50b71d8f0eae6007bedc329eecb24bb5aba3.tar.lz
hypervideo-1e5a50b71d8f0eae6007bedc329eecb24bb5aba3.tar.xz
hypervideo-1e5a50b71d8f0eae6007bedc329eecb24bb5aba3.zip
update from upstream
Diffstat (limited to 'hypervideo_dl/extractor/telegram.py')
-rw-r--r-- hypervideo_dl/extractor/telegram.py 37
1 files changed, 37 insertions, 0 deletions
diff --git a/hypervideo_dl/extractor/telegram.py b/hypervideo_dl/extractor/telegram.py
new file mode 100644
index 0000000..2dfa261
--- /dev/null
+++ b/hypervideo_dl/extractor/telegram.py
@@ -0,0 +1,37 @@
+from .common import InfoExtractor
+
+
+class TelegramEmbedIE(InfoExtractor):
+    """Extractor for a video attached to a public ``t.me/<channel>/<id>`` post.
+
+    Two pages are fetched per post: the post page itself, whose Open Graph /
+    Twitter meta tags supply the title and description, and the same URL
+    with ``embed=1``, whose markup carries the ``<video>`` source and the
+    thumbnail.
+    """
+
+    IE_NAME = 'telegram:embed'
+    _VALID_URL = r'https?://t\.me/(?P<channel_name>[^/]+)/(?P<id>\d+)'
+    _TESTS = [{
+        'url': 'https://t.me/europa_press/613',
+        'info_dict': {
+            'id': '613',
+            'ext': 'mp4',
+            'title': 'Europa Press',
+            # The expected value is a digest of the description, so it needs
+            # the ``md5:`` prefix; without it the literal text is compared.
+            'description': 'md5:6ce2d7e8d56eda16d80607b23db7b252',
+            'thumbnail': r're:^https?:\/\/cdn.*?telesco\.pe\/file\/\w+',
+        },
+    }]
+
+    def _real_extract(self, url):
+        """Build the info dict for the post at ``url``.
+
+        The title and the video source are required. The description and
+        the thumbnail are optional metadata, so a post lacking either one
+        is still extracted.
+        """
+        video_id = self._match_id(url)
+        webpage = self._download_webpage(url, video_id)
+        # Pass ``embed`` via ``query`` instead of appending '?embed=1' by
+        # hand: _VALID_URL is not end-anchored, so ``url`` may already carry
+        # a query string, and a second '?' would corrupt the request URL.
+        webpage_embed = self._download_webpage(
+            url, video_id, note='Downloading embed page', query={'embed': '1'})
+
+        formats = [{
+            'url': self._proto_relative_url(self._search_regex(
+                r'<video[^>]+src="([^"]+)"', webpage_embed, 'source')),
+            'ext': 'mp4',
+        }]
+        self._sort_formats(formats)
+
+        return {
+            'id': video_id,
+            'title': self._html_search_meta(
+                ['og:title', 'twitter:title'], webpage, fatal=True),
+            # Optional field: must not abort extraction when absent.
+            'description': self._html_search_meta(
+                ['og:description', 'twitter:description'], webpage),
+            # Optional field: must not abort extraction when absent.
+            'thumbnail': self._search_regex(
+                r'tgme_widget_message_video_thumb"[^>]+background-image:url\(\'([^\']+)\'\)',
+                webpage_embed, 'thumbnail', fatal=False),
+            'formats': formats,
+        }