Include fix for rg3/youtube-dl#18052 (no view count)

author: James Taylor <user234683@users.noreply.github.com> 2018-11-05 01:29:50 -0800
committer: James Taylor <user234683@users.noreply.github.com> 2018-11-05 01:29:50 -0800
commit: 4b9e9529bed5c8366f8ba67db8fae27cf335b852 (patch)
tree: 637bd4df6fd3648065de34efc4c106d805b7e58c
parent: 8784070e75685086b2c1db2973e2082743da6296 (diff)
download: yt-local-4b9e9529bed5c8366f8ba67db8fae27cf335b852.tar.lz
yt-local-4b9e9529bed5c8366f8ba67db8fae27cf335b852.tar.xz
yt-local-4b9e9529bed5c8366f8ba67db8fae27cf335b852.zip
1 files changed, 31 insertions, 1 deletions
diff --git a/youtube_dl/extractor/youtube.py b/youtube_dl/extractor/youtube.py
index 85c90dc..544cfb6 100644
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -42,6 +42,7 @@ from ..utils import (
     remove_quotes,
     remove_start,
     smuggle_url,
+    str_or_none,
     str_to_int,
     try_get,
     unescapeHTML,
@@ -1532,6 +1533,9 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
 
         def extract_view_count(v_info):
             return int_or_none(try_get(v_info, lambda x: x['view_count'][0]))
+
+        player_response = {}
+
         # Is it unlisted?
         unlisted = (self._search_regex('''<meta itemprop="unlisted" content="(\w*)">''', video_webpage, 'is_unlisted', default='False') == "True")
 
@@ -1629,6 +1633,12 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
                 if args.get('livestream') == '1' or args.get('live_playback') == 1:
                     is_live = True
                 sts = ytplayer_config.get('sts')
+                if not player_response:
+                    pl_response = str_or_none(args.get('player_response'))
+                    if pl_response:
+                        pl_response = self._parse_json(pl_response, video_id, fatal=False)
+                        if isinstance(pl_response, dict):
+                            player_response = pl_response
             if not video_info or self._downloader.params.get('youtube_include_dash_manifest', True):
                 # We also try looking in get_video_info since it may contain different dashmpd
                 # URL that points to a DASH manifest with possibly different itag set (some itags
@@ -1657,6 +1667,10 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
                     if not video_info_webpage:
                         continue
                     get_video_info = compat_parse_qs(video_info_webpage)
+                    if not player_response:
+                        pl_response = get_video_info.get('player_response', [None])[0]
+                        if isinstance(pl_response, dict):
+                            player_response = pl_response
                     add_dash_mpd(get_video_info)
                     if view_count is None:
                         view_count = extract_view_count(get_video_info)
@@ -1703,9 +1717,14 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
                     '"token" parameter not in video info for unknown reason',
                     video_id=video_id)
 
+        video_details = try_get(
+            player_response, lambda x: x['videoDetails'], dict) or {}
+
         # title
         if 'title' in video_info:
             video_title = video_info['title'][0]
+        elif 'title' in player_response:
+            video_title = video_details['title']
         else:
             self._downloader.report_warning('Unable to extract video title')
             video_title = '_'
@@ -1768,6 +1787,8 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
 
         if view_count is None:
             view_count = extract_view_count(video_info)
+        if view_count is None and video_details:
+            view_count = int_or_none(video_details.get('viewCount'))
 
         # Check for "rental" videos
         if 'ypc_video_rental_bar_text' in video_info and 'author' not in video_info:
@@ -1950,7 +1971,9 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
             raise ExtractorError('no conn, hlsvp or url_encoded_fmt_stream_map information found in video info')
 
         # uploader
-        video_uploader = try_get(video_info, lambda x: x['author'][0], compat_str)
+        video_uploader = try_get(
+            video_info, lambda x: x['author'][0],
+            compat_str) or str_or_none(video_details.get('author'))
         if video_uploader:
             video_uploader = compat_urllib_parse_unquote_plus(video_uploader)
         else:
@@ -2059,6 +2082,11 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
         like_count = _extract_count('like')
         dislike_count = _extract_count('dislike')
 
+        if view_count is None:
+            view_count = str_to_int(self._search_regex(
+                r'<[^>]+class=["\']watch-view-count[^>]+>\s*([\d,\s]+)', video_webpage,
+                'view count', default=None))
+
         # subtitles
         video_subtitles = self._get_subtitles(video_id, video_webpage)
         automatic_captions = self._get_automatic_captions(video_id, video_webpage)
@@ -2066,6 +2094,8 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
         video_duration = try_get(
             video_info, lambda x: int_or_none(x['length_seconds'][0]))
         if not video_duration:
+            video_duration = int_or_none(video_details.get('lengthSeconds'))
+        if not video_duration:
             video_duration = parse_duration(self._html_search_meta(
                 'duration', video_webpage, 'video duration'))
author	James Taylor <user234683@users.noreply.github.com>	2018-11-05 01:29:50 -0800
committer	James Taylor <user234683@users.noreply.github.com>	2018-11-05 01:29:50 -0800
commit	4b9e9529bed5c8366f8ba67db8fae27cf335b852 (patch)
tree	637bd4df6fd3648065de34efc4c106d805b7e58c
parent	8784070e75685086b2c1db2973e2082743da6296 (diff)
download	yt-local-4b9e9529bed5c8366f8ba67db8fae27cf335b852.tar.lz yt-local-4b9e9529bed5c8366f8ba67db8fae27cf335b852.tar.xz yt-local-4b9e9529bed5c8366f8ba67db8fae27cf335b852.zip