[extractor/lumni] Add extractor (#6302)

Authored by: carusocr
Closes #6202
author: Chris Caruso <carusochrisr@gmail.com> 2023-03-04 11:22:11 -0800
committer: GitHub <noreply@github.com> 2023-03-05 00:52:11 +0530
commit: 1f8489cccbdc6e96027ef527b88717458f0900e8 (patch)
tree: 7dba674eaf74e90737c26233eb3f862387c81397
parent: ed4cc4ea793314c50ae3f82e98248c1de1c25694 (diff)
download: hypervideo-pre-1f8489cccbdc6e96027ef527b88717458f0900e8.tar.lz
hypervideo-pre-1f8489cccbdc6e96027ef527b88717458f0900e8.tar.xz
hypervideo-pre-1f8489cccbdc6e96027ef527b88717458f0900e8.zip
2 files changed, 27 insertions, 0 deletions
diff --git a/yt_dlp/extractor/_extractors.py b/yt_dlp/extractor/_extractors.py
index 0731845ba..ccac634b3 100644
--- a/yt_dlp/extractor/_extractors.py
+++ b/yt_dlp/extractor/_extractors.py
@@ -962,6 +962,9 @@ from .lrt import (
     LRTVODIE,
     LRTStreamIE
 )
+from .lumni import (
+    LumniIE
+)
 from .lynda import (
     LyndaIE,
     LyndaCourseIE
diff --git a/yt_dlp/extractor/lumni.py b/yt_dlp/extractor/lumni.py
new file mode 100644
index 000000000..5810da0c8
--- /dev/null
+++ b/yt_dlp/extractor/lumni.py
@@ -0,0 +1,24 @@
+from .common import InfoExtractor
+from .francetv import FranceTVIE
+
+
+class LumniIE(InfoExtractor):
+    _VALID_URL = r'https?://(?:www\.)?lumni\.fr/video/(?P<id>[\w-]+)'
+    _TESTS = [{
+        'url': 'https://www.lumni.fr/video/l-homme-et-son-environnement-dans-la-revolution-industrielle',
+        'md5': '960e8240c4f2c7a20854503a71e52f5e',
+        'info_dict': {
+            'id': 'd2b9a4e5-a526-495b-866c-ab72737e3645',
+            'ext': 'mp4',
+            'title': "L'homme et son environnement dans la révolution industrielle - L'ère de l'homme",
+            'thumbnail': 'https://assets.webservices.francetelevisions.fr/v1/assets/images/a7/17/9f/a7179f5f-63a5-4e11-8d4d-012ab942d905.jpg',
+            'duration': 230,
+        }
+    }]
+
+    def _real_extract(self, url):
+        display_id = self._match_id(url)
+        webpage = self._download_webpage(url, display_id)
+        video_id = self._html_search_regex(
+            r'<div[^>]+data-factoryid\s*=\s*["\']([^"\']+)', webpage, 'video id')
+        return self.url_result(f'francetv:{video_id}', FranceTVIE, video_id)
author	Chris Caruso <carusochrisr@gmail.com>	2023-03-04 11:22:11 -0800
committer	GitHub <noreply@github.com>	2023-03-05 00:52:11 +0530
commit	1f8489cccbdc6e96027ef527b88717458f0900e8 (patch)
tree	7dba674eaf74e90737c26233eb3f862387c81397
parent	ed4cc4ea793314c50ae3f82e98248c1de1c25694 (diff)
download	hypervideo-pre-1f8489cccbdc6e96027ef527b88717458f0900e8.tar.lz hypervideo-pre-1f8489cccbdc6e96027ef527b88717458f0900e8.tar.xz hypervideo-pre-1f8489cccbdc6e96027ef527b88717458f0900e8.zip