diff options
author | sqrtNOT <77981959+sqrtNOT@users.noreply.github.com> | 2022-07-17 10:34:33 +0000 |
---|---|---|
committer | GitHub <noreply@github.com> | 2022-07-17 16:04:33 +0530 |
commit | 129dfa5f459f065d8be6205acda3a024127a894f (patch) | |
tree | 6e23ef70fd872cca6fd663f6168aeb4a2ac5db5c /yt_dlp/extractor/wsj.py | |
parent | 3df6a603e4753f08bc44cdbbb45832970466f436 (diff) | |
download | hypervideo-pre-129dfa5f459f065d8be6205acda3a024127a894f.tar.lz hypervideo-pre-129dfa5f459f065d8be6205acda3a024127a894f.tar.xz hypervideo-pre-129dfa5f459f065d8be6205acda3a024127a894f.zip |
[extractor/WSJArticle] Fix video id extraction (#4268)
Closes #4249
Authored by: sqrtNOT
Diffstat (limited to 'yt_dlp/extractor/wsj.py')
-rw-r--r-- | yt_dlp/extractor/wsj.py | 3 |
1 file changed, 2 insertions, 1 deletion
```diff
diff --git a/yt_dlp/extractor/wsj.py b/yt_dlp/extractor/wsj.py
index 8be3645e3..9eeed104f 100644
--- a/yt_dlp/extractor/wsj.py
+++ b/yt_dlp/extractor/wsj.py
@@ -116,5 +116,6 @@ class WSJArticleIE(InfoExtractor):
         article_id = self._match_id(url)
         webpage = self._download_webpage(url, article_id)
         video_id = self._search_regex(
-            r'data-src=["\']([a-fA-F0-9-]{36})', webpage, 'video id')
+            r'(?:id=["\']video|video-|iframe\.html\?guid=|data-src=["\'])([a-fA-F0-9-]{36})',
+            webpage, 'video id')
         return self.url_result('wsj:%s' % video_id, WSJIE.ie_key(), video_id)
```