[instagram] Fix extractor

author: The Hatsune Daishi <nao20010128@gmail.com> 2020-11-06 15:15:07 +0900
committer: GitHub <noreply@github.com> 2020-11-06 15:15:07 +0900
commit: 987d2e079ad0fd45df19b6183d38f83bcd528e9d (patch)
tree: 69ae3716260eae4d03691b73a7b298cc6211f37f
parent: adb118da2667522babf2b849a7ad1f5c44b8873b (diff)
download: hypervideo-pre-987d2e079ad0fd45df19b6183d38f83bcd528e9d.tar.lz
hypervideo-pre-987d2e079ad0fd45df19b6183d38f83bcd528e9d.tar.xz
hypervideo-pre-987d2e079ad0fd45df19b6183d38f83bcd528e9d.zip
1 files changed, 14 insertions, 7 deletions
diff --git a/youtube_dlc/extractor/instagram.py b/youtube_dlc/extractor/instagram.py
index b061850a1..bbfe23c76 100644
--- a/youtube_dlc/extractor/instagram.py
+++ b/youtube_dlc/extractor/instagram.py
@@ -126,16 +126,23 @@ class InstagramIE(InfoExtractor):
          uploader_id, like_count, comment_count, comments, height,
          width) = [None] * 11
 
-        shared_data = self._parse_json(
-            self._search_regex(
-                r'window\._sharedData\s*=\s*({.+?});',
-                webpage, 'shared data', default='{}'),
-            video_id, fatal=False)
+        shared_data = try_get(webpage,
+                              (lambda x: self._parse_json(
+                                  self._search_regex(
+                                      r'window\.__additionalDataLoaded\(\'/(?:p|tv)/(?:[^/?#&]+)/\',({.+?})\);',
+                                      x, 'additional data', default='{}'),
+                                  video_id, fatal=False),
+                               lambda x: self._parse_json(
+                                  self._search_regex(
+                                      r'window\._sharedData\s*=\s*({.+?});',
+                                      x, 'shared data', default='{}'),
+                                  video_id, fatal=False)['entry_data']['PostPage'][0]),
+                              None)
         if shared_data:
             media = try_get(
                 shared_data,
-                (lambda x: x['entry_data']['PostPage'][0]['graphql']['shortcode_media'],
-                 lambda x: x['entry_data']['PostPage'][0]['media']),
+                (lambda x: x['graphql']['shortcode_media'],
+                 lambda x: x['media']),
                 dict)
             if media:
                 video_url = media.get('video_url')
author	The Hatsune Daishi <nao20010128@gmail.com>	2020-11-06 15:15:07 +0900
committer	GitHub <noreply@github.com>	2020-11-06 15:15:07 +0900
commit	987d2e079ad0fd45df19b6183d38f83bcd528e9d (patch)
tree	69ae3716260eae4d03691b73a7b298cc6211f37f
parent	adb118da2667522babf2b849a7ad1f5c44b8873b (diff)
download	hypervideo-pre-987d2e079ad0fd45df19b6183d38f83bcd528e9d.tar.lz hypervideo-pre-987d2e079ad0fd45df19b6183d38f83bcd528e9d.tar.xz hypervideo-pre-987d2e079ad0fd45df19b6183d38f83bcd528e9d.zip