From e158c4842b123944137b985e5d436ecebd2f51f4 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Fri, 15 Feb 2019 20:27:37 -0800
Subject: subscriptions: basic database code

---
 youtube/subscriptions.py | 82 +++++++++++++++++++++++++++++++++++++++++-------
 1 file changed, 70 insertions(+), 12 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 47f1ea3..39957bf 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -1,18 +1,76 @@
-import urllib
+from youtube import common, settings
+import sqlite3
+import os
 
-with open("subscriptions.txt", 'r', encoding='utf-8') as file:
-    subscriptions = file.read()
-    
-# Line format: "channel_id channel_name"
-# Example:
-# UCYO_jab_esuFRV4b17AJtAw 3Blue1Brown
+# https://stackabuse.com/a-sqlite-tutorial-with-python/
 
-subscriptions = ((line[0:24], line[25: ]) for line in subscriptions.splitlines())
+database_path = os.path.join(settings.data_dir, "subscriptions.sqlite")
 
-def get_new_videos():
-    for channel_id, channel_name in subscriptions:
-        
+def open_database():
+    if not os.path.exists(settings.data_dir):
+        os.makedirs(settings.data_dir)
+    connection = sqlite3.connect(database_path)
 
+    # Create tables if they don't exist
+    try:
+        cursor = connection.cursor()
+        cursor.execute('''CREATE TABLE IF NOT EXISTS subscribed_channels (
+                              id integer PRIMARY KEY,
+                              channel_id text NOT NULL,
+                              channel_name text NOT NULL,
+                              time_last_checked integer
+                          )''')
+        cursor.execute('''CREATE TABLE IF NOT EXISTS videos (
+                              id integer PRIMARY KEY,
+                              uploader_id integer NOT NULL REFERENCES subscribed_channels(id) ON UPDATE CASCADE ON DELETE CASCADE,
+                              video_id text NOT NULL,
+                              title text NOT NULL,
+                              time_published integer NOT NULL,
+                              description text,
+                          )''')
+        connection.commit()
+    except:
+        connection.rollback()
+        connection.close()
+        raise
 
+    return connection
 
-def get_subscriptions_page():
+def _subscribe(channel_id, channel_name):
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
+        cursor.execute("INSERT INTO subscribed_channels (channel_id, name) VALUES (?, ?)", (channel_id, channel_name))
+        connection.commit()
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
+
+def _unsubscribe(channel_id):
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
+        cursor.execute("DELETE FROM subscribed_channels WHERE channel_id=?", (channel_id, ))
+        connection.commit()
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
+
+def _get_videos(number, offset):
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
+        cursor.execute('''SELECT video_id, title, time_published, description, channel_id, channel_name
+                          FROM videos
+                          INNER JOIN subscribed_channels on videos.uploader_id = subscribed_channels.id
+                          ORDER BY time_published DESC
+                          LIMIT ? OFFSET ?''', number, offset)
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
-- 
cgit v1.2.3


From c65df7d27df64049e1597e245758f70e808173e1 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 16 Feb 2019 14:00:06 -0800
Subject: subscriptions: Basic new videos checking function for channel

---
 youtube/subscriptions.py | 103 ++++++++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 102 insertions(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 39957bf..0d31bd4 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -1,6 +1,14 @@
-from youtube import common, settings
+from youtube import common, settings, channel
 import sqlite3
 import os
+import secrets
+import datetime
+
+# so as to not completely break on people who have updated but don't know of new dependency
+try:
+    import atoma
+except ModuleNotFoundError:
+    print('Error: atoma not installed, subscriptions will not work')
 
 # https://stackabuse.com/a-sqlite-tutorial-with-python/
 
@@ -74,3 +82,96 @@ def _get_videos(number, offset):
         raise
     finally:
         connection.close()
+
+
+
+units = {
+    'year': 31536000,   # 365*24*3600
+    'month': 2592000,   # 30*24*3600
+    'week': 604800,     # 7*24*3600
+    'day':  86400,      # 24*3600
+    'hour': 3600,
+    'minute': 60,
+    'second': 1,
+}
+def youtube_timestamp_to_posix(dumb_timestamp):
+    ''' Given a dumbed down timestamp such as 1 year ago, 3 hours ago,
+         approximates the unix time (seconds since 1/1/1970) '''
+    dumb_timestamp = dumb_timestamp.lower()
+    now = time.time()
+    if dumb_timestamp == "just now":
+        return now
+    split = dumb_timestamp.split(' ')
+    number, unit = int(split[0]), split[1]
+    if number > 1:
+        unit = unit[:-1]    # remove s from end
+    return now - number*units[unit]
+
+
+weekdays = ('Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun')
+months = ('Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec')
+def _get_upstream_videos(channel_id, channel_name, time_last_checked):
+    feed_url = "https://www.youtube.com/feeds/videos.xml?channel_id=" + channel_id
+    headers = {}
+
+    # randomly change time_last_checked up to one day earlier to make tracking harder
+    time_last_checked = time_last_checked - secrets.randbelow(24*3600)
+
+    # If-Modified-Since header: https://developer.mozilla.org/en-US/docs/Web/HTTP/Headers/If-Modified-Since
+    struct_time = time.gmtime(time_last_checked)
+    weekday = weekdays[struct_time.tm_wday]     # dumb requirement
+    month = months[struct_time.tm_mon - 1]
+    headers['If-Modified-Since'] = time.strftime(weekday + ', %d ' + month + ' %Y %H:%M:%S GMT', struct_time)
+    print(headers['If-Modified-Since'])
+
+
+    headers['User-Agent'] = 'Python-urllib'     # Don't leak python version
+    headers['Accept-Encoding'] = 'gzip, br'
+    req = urllib.request.Request(url, headers=headers)
+    if settings.route_tor:
+        opener = urllib.request.build_opener(sockshandler.SocksiPyHandler(socks.PROXY_TYPE_SOCKS5, "127.0.0.1", 9150))
+    else:
+        opener = urllib.request.build_opener()
+    response = opener.open(req, timeout=15)
+
+
+    if response.getcode == '304':
+        print('No new videos for ' + channel_id)
+        return []
+
+
+    content = response.read()
+    print('Retrieved videos for ' + channel_id)
+    content = common.decode_content(content, response.getheader('Content-Encoding', default='identity'))
+
+
+    feed = atoma.parse_atom_bytes(content)
+    atom_videos = {}
+    for entry in feed.entries:
+        video_id = entry.id_[9:]     # example of id_: yt:video:q6EoRBvdVPQ
+
+        # standard names used in this program for purposes of html templating
+        atom_videos[video_id] = {
+            'title': entry.title.value,
+            'author': entry.authors[0].name,
+            #'description': '',              # Not supported by atoma
+            #'duration': '',                 # Youtube's atom feeds don't provide it.. very frustrating
+            'published':    entry.published.strftime('%m/%d/%Y'),
+            'time_published':   int(entry.published.timestamp()),
+        }
+
+
+    # final list
+    videos = []
+
+    # Now check channel page to retrieve missing information for videos
+    json_channel_videos = channel.get_grid_items(channel.get_channel_tab(channel_id)[1]['response'])
+    for json_video in json_channel_videos:
+        info = renderer_info(json_video)
+        if info['id'] in atom_videos:
+            info.update(atom_videos[info['id']])
+        else:
+            info['author'] = channel_name
+            info['time published'] = youtube_timestamp_to_posix(info['published'])
+        videos.append(info)
+    return videos
-- 
cgit v1.2.3


From 4a54c4fe301f37ae63e98defe8240a5d526361c6 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 16 Feb 2019 16:11:53 -0800
Subject: subscriptions: store video duration in database

---
 youtube/subscriptions.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 0d31bd4..a0f7e48 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -33,6 +33,7 @@ def open_database():
                               uploader_id integer NOT NULL REFERENCES subscribed_channels(id) ON UPDATE CASCADE ON DELETE CASCADE,
                               video_id text NOT NULL,
                               title text NOT NULL,
+                              duration text,
                               time_published integer NOT NULL,
                               description text,
                           )''')
@@ -72,7 +73,7 @@ def _get_videos(number, offset):
     connection = open_database()
     try:
         cursor = connection.cursor()
-        cursor.execute('''SELECT video_id, title, time_published, description, channel_id, channel_name
+        cursor.execute('''SELECT video_id, title, duration, time_published, description, channel_id, channel_name
                           FROM videos
                           INNER JOIN subscribed_channels on videos.uploader_id = subscribed_channels.id
                           ORDER BY time_published DESC
-- 
cgit v1.2.3


From 24642455d0dc5841ddec99f456598c4f763c1e8a Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 16 Feb 2019 16:56:46 -0800
Subject: subscriptions page

---
 youtube/subscriptions.py | 37 +++++++++++++++++++++++++++++++++----
 youtube/youtube.py       |  4 +++-
 2 files changed, 36 insertions(+), 5 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index a0f7e48..82916dd 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -1,4 +1,6 @@
-from youtube import common, settings, channel
+from youtube import common, channel
+import settings
+from string import Template
 import sqlite3
 import os
 import secrets
@@ -10,6 +12,10 @@ try:
 except ModuleNotFoundError:
     print('Error: atoma not installed, subscriptions will not work')
 
+with open('yt_subscriptions_template.html', 'r', encoding='utf-8') as f:
+    subscriptions_template = Template(f.read())
+
+
 # https://stackabuse.com/a-sqlite-tutorial-with-python/
 
 database_path = os.path.join(settings.data_dir, "subscriptions.sqlite")
@@ -35,7 +41,7 @@ def open_database():
                               title text NOT NULL,
                               duration text,
                               time_published integer NOT NULL,
-                              description text,
+                              description text
                           )''')
         connection.commit()
     except:
@@ -73,11 +79,19 @@ def _get_videos(number, offset):
     connection = open_database()
     try:
         cursor = connection.cursor()
-        cursor.execute('''SELECT video_id, title, duration, time_published, description, channel_id, channel_name
+        db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
                           FROM videos
                           INNER JOIN subscribed_channels on videos.uploader_id = subscribed_channels.id
                           ORDER BY time_published DESC
-                          LIMIT ? OFFSET ?''', number, offset)
+                          LIMIT ? OFFSET ?''', (number, offset))
+
+        for db_video in db_videos:
+            yield {
+                'id':   db_video[0],
+                'title':    db_video[1],
+                'duration': db_video[2],
+                'author':   db_video[3],
+            }
     except:
         connection.rollback()
         raise
@@ -176,3 +190,18 @@ def _get_upstream_videos(channel_id, channel_name, time_last_checked):
             info['time published'] = youtube_timestamp_to_posix(info['published'])
         videos.append(info)
     return videos
+
+def get_subscriptions_page(env, start_response):
+    items_html = '''<nav class="item-grid">\n'''
+
+    for item in _get_videos(30, 0):
+        items_html += common.video_item_html(info, common.small_video_item_template)
+    items_html += '''\n</nav>'''
+
+    start_response('200 OK', [('Content-type','text/html'),])
+    return subscriptions_template.substitute(
+        header = common.get_header(),
+        items = items_html,
+        page_buttons = '',
+    ).encode('utf-8')
+
diff --git a/youtube/youtube.py b/youtube/youtube.py
index b6b12fb..ad73a6e 100644
--- a/youtube/youtube.py
+++ b/youtube/youtube.py
@@ -1,7 +1,7 @@
 import mimetypes
 import urllib.parse
 import os
-from youtube import local_playlist, watch, search, playlist, channel, comments, common, post_comment, accounts
+from youtube import local_playlist, watch, search, playlist, channel, comments, common, post_comment, accounts, subscriptions
 import settings
 YOUTUBE_FILES = (
     "/shared.css",
@@ -24,6 +24,8 @@ get_handlers = {
     'post_comment':     post_comment.get_post_comment_page,
     'delete_comment':   post_comment.get_delete_comment_page,
     'login':            accounts.get_account_login_page,
+
+    'subscriptions':    subscriptions.get_subscriptions_page,
 }
 post_handlers = {
     'edit_playlist':    local_playlist.edit_playlist,
-- 
cgit v1.2.3


From 3905e7e64059b45479894ba1fdfb0ef9cef64475 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 16 Feb 2019 23:41:52 -0800
Subject: basic subscriptions system

---
 youtube/channel.py       |  4 +++
 youtube/subscriptions.py | 71 +++++++++++++++++++++++++++++++++++++++---------
 youtube/youtube.py       |  2 ++
 3 files changed, 64 insertions(+), 13 deletions(-)

(limited to 'youtube')

diff --git a/youtube/channel.py b/youtube/channel.py
index 9577525..c83d7d1 100644
--- a/youtube/channel.py
+++ b/youtube/channel.py
@@ -248,6 +248,7 @@ def channel_videos_html(polymer_json, current_page=1, current_sort=3, number_of_
     return yt_channel_items_template.substitute(
         header              = common.get_header(),
         channel_title       = microformat['title'],
+        channel_id          = channel_id,
         channel_tabs        = channel_tabs_html(channel_id, 'Videos'),
         sort_buttons        = channel_sort_buttons_html(channel_id, 'videos', current_sort),
         avatar              = '/' + microformat['thumbnail']['thumbnails'][0]['url'],
@@ -269,6 +270,7 @@ def channel_playlists_html(polymer_json, current_sort=3):
     return yt_channel_items_template.substitute(
         header              = common.get_header(),
         channel_title       = microformat['title'],
+        channel_id          = channel_id,
         channel_tabs        = channel_tabs_html(channel_id, 'Playlists'),
         sort_buttons        = channel_sort_buttons_html(channel_id, 'playlists', current_sort),
         avatar              = '/' + microformat['thumbnail']['thumbnails'][0]['url'],
@@ -333,6 +335,7 @@ def channel_about_page(polymer_json):
         description         = description,
         links               = channel_links,
         stats               = stats,
+        channel_id          = channel_metadata['channelId'],
         channel_tabs        = channel_tabs_html(channel_metadata['channelId'], 'About'),
     )
 
@@ -353,6 +356,7 @@ def channel_search_page(polymer_json, query, current_page=1, number_of_videos =
     return yt_channel_items_template.substitute(
         header              = common.get_header(),
         channel_title       = html.escape(microformat['title']),
+        channel_id          = channel_id,
         channel_tabs        = channel_tabs_html(channel_id, '', query),
         avatar              = '/' + microformat['thumbnail']['thumbnails'][0]['url'],
         page_title          = html.escape(query + ' - Channel search'),
diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 82916dd..ff7d0df 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -5,6 +5,10 @@ import sqlite3
 import os
 import secrets
 import datetime
+import itertools
+import time
+import urllib
+import socks, sockshandler
 
 # so as to not completely break on people who have updated but don't know of new dependency
 try:
@@ -51,11 +55,16 @@ def open_database():
 
     return connection
 
-def _subscribe(channel_id, channel_name):
+def _subscribe(channels):
+    ''' channels is a list of (channel_id, channel_name) '''
+
+    # set time_last_checked to 0 on all channels being subscribed to
+    channels = ( (channel_id, channel_name, 0) for channel_id, channel_name in channels)
+
     connection = open_database()
     try:
         cursor = connection.cursor()
-        cursor.execute("INSERT INTO subscribed_channels (channel_id, name) VALUES (?, ?)", (channel_id, channel_name))
+        cursor.executemany("INSERT INTO subscribed_channels (channel_id, channel_name, time_last_checked) VALUES (?, ?, ?)", channels)
         connection.commit()
     except:
         connection.rollback()
@@ -63,11 +72,12 @@ def _subscribe(channel_id, channel_name):
     finally:
         connection.close()
 
-def _unsubscribe(channel_id):
+def _unsubscribe(channel_ids):
+    ''' channel_ids is a list of channel_ids '''
     connection = open_database()
     try:
         cursor = connection.cursor()
-        cursor.execute("DELETE FROM subscribed_channels WHERE channel_id=?", (channel_id, ))
+        cursor.executemany("DELETE FROM subscribed_channels WHERE channel_id=?", ((channel_id, ) for channel_id in channel_ids))
         connection.commit()
     except:
         connection.rollback()
@@ -125,12 +135,14 @@ def youtube_timestamp_to_posix(dumb_timestamp):
 
 weekdays = ('Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun')
 months = ('Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec')
-def _get_upstream_videos(channel_id, channel_name, time_last_checked):
+def _get_upstream_videos(channel_id, time_last_checked):
     feed_url = "https://www.youtube.com/feeds/videos.xml?channel_id=" + channel_id
     headers = {}
 
     # randomly change time_last_checked up to one day earlier to make tracking harder
     time_last_checked = time_last_checked - secrets.randbelow(24*3600)
+    if time_last_checked < 0:   # happens when time_last_checked is initialized to 0 when checking for first time
+        time_last_checked = 0
 
     # If-Modified-Since header: https://developer.mozilla.org/en-US/docs/Web/HTTP/Headers/If-Modified-Since
     struct_time = time.gmtime(time_last_checked)
@@ -142,7 +154,7 @@ def _get_upstream_videos(channel_id, channel_name, time_last_checked):
 
     headers['User-Agent'] = 'Python-urllib'     # Don't leak python version
     headers['Accept-Encoding'] = 'gzip, br'
-    req = urllib.request.Request(url, headers=headers)
+    req = urllib.request.Request(feed_url, headers=headers)
     if settings.route_tor:
         opener = urllib.request.build_opener(sockshandler.SocksiPyHandler(socks.PROXY_TYPE_SOCKS5, "127.0.0.1", 9150))
     else:
@@ -165,13 +177,10 @@ def _get_upstream_videos(channel_id, channel_name, time_last_checked):
     for entry in feed.entries:
         video_id = entry.id_[9:]     # example of id_: yt:video:q6EoRBvdVPQ
 
-        # standard names used in this program for purposes of html templating
         atom_videos[video_id] = {
             'title': entry.title.value,
-            'author': entry.authors[0].name,
             #'description': '',              # Not supported by atoma
             #'duration': '',                 # Youtube's atom feeds don't provide it.. very frustrating
-            'published':    entry.published.strftime('%m/%d/%Y'),
             'time_published':   int(entry.published.timestamp()),
         }
 
@@ -182,12 +191,13 @@ def _get_upstream_videos(channel_id, channel_name, time_last_checked):
     # Now check channel page to retrieve missing information for videos
     json_channel_videos = channel.get_grid_items(channel.get_channel_tab(channel_id)[1]['response'])
     for json_video in json_channel_videos:
-        info = renderer_info(json_video)
+        info = common.renderer_info(json_video['gridVideoRenderer'])
+        if 'description' not in info:
+            info['description'] = ''
         if info['id'] in atom_videos:
             info.update(atom_videos[info['id']])
         else:
-            info['author'] = channel_name
-            info['time published'] = youtube_timestamp_to_posix(info['published'])
+            info['time_published'] = youtube_timestamp_to_posix(info['published'])
         videos.append(info)
     return videos
 
@@ -195,7 +205,7 @@ def get_subscriptions_page(env, start_response):
     items_html = '''<nav class="item-grid">\n'''
 
     for item in _get_videos(30, 0):
-        items_html += common.video_item_html(info, common.small_video_item_template)
+        items_html += common.video_item_html(item, common.small_video_item_template)
     items_html += '''\n</nav>'''
 
     start_response('200 OK', [('Content-type','text/html'),])
@@ -205,3 +215,38 @@ def get_subscriptions_page(env, start_response):
         page_buttons = '',
     ).encode('utf-8')
 
+def post_subscriptions_page(env, start_response):
+    params = env['parameters']
+    action = params['action'][0]
+    if action == 'subscribe':
+        if len(params['channel_id']) != len(params['channel_name']):
+            start_response('400 Bad Request', ())
+            return b'400 Bad Request, length of channel_id != length of channel_name'
+        _subscribe(zip(params['channel_id'], params['channel_name']))
+
+    elif action == 'unsubscribe':
+        _unsubscribe(params['channel_id'])
+
+    elif action == 'refresh':
+        connection = open_database()
+        try:
+            cursor = connection.cursor()
+            for uploader_id, channel_id, time_last_checked in cursor.execute('''SELECT id, channel_id, time_last_checked FROM subscribed_channels'''):
+                db_videos = ( (uploader_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(channel_id, time_last_checked) )
+                cursor.executemany('''INSERT INTO videos (uploader_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
+
+            cursor.execute('''UPDATE subscribed_channels SET time_last_checked = ?''', ( int(time.time()), ) )
+            connection.commit()
+        except:
+            connection.rollback()
+            raise
+        finally:
+            connection.close()
+
+        start_response('303 See Other', [('Location', common.URL_ORIGIN + '/subscriptions'),] )
+        return b''
+    else:
+        start_response('400 Bad Request', ())
+        return b'400 Bad Request'
+    start_response('204 No Content', ())
+    return b''
diff --git a/youtube/youtube.py b/youtube/youtube.py
index ad73a6e..288f68b 100644
--- a/youtube/youtube.py
+++ b/youtube/youtube.py
@@ -35,6 +35,8 @@ post_handlers = {
     'comments':         post_comment.post_comment,
     'post_comment':     post_comment.post_comment,
     'delete_comment':   post_comment.delete_comment,
+
+    'subscriptions':    subscriptions.post_subscriptions_page,
 }
 
 def youtube(env, start_response):
-- 
cgit v1.2.3


From 1807bfac4952c23dd4031007b44026e920951336 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 3 Jun 2019 02:05:30 -0700
Subject: Remove feed parsing for now since youtube doesn't honor
 If-Modified-Since header

---
 youtube/subscriptions.py | 71 +++---------------------------------------------
 1 file changed, 4 insertions(+), 67 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 0c7e8a5..a7b94bc 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -10,12 +10,6 @@ import time
 import urllib
 import socks, sockshandler
 
-# so as to not completely break on people who have updated but don't know of new dependency
-try:
-    import atoma
-except ModuleNotFoundError:
-    print('Error: atoma not installed, subscriptions will not work')
-
 with open('yt_subscriptions_template.html', 'r', encoding='utf-8') as f:
     subscriptions_template = Template(f.read())
 
@@ -132,72 +126,15 @@ def youtube_timestamp_to_posix(dumb_timestamp):
         unit = unit[:-1]    # remove s from end
     return now - number*units[unit]
 
-
-weekdays = ('Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun')
-months = ('Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec')
-def _get_upstream_videos(channel_id, time_last_checked):
-    feed_url = "https://www.youtube.com/feeds/videos.xml?channel_id=" + channel_id
-    headers = {}
-
-    # randomly change time_last_checked up to one day earlier to make tracking harder
-    time_last_checked = time_last_checked - secrets.randbelow(24*3600)
-    if time_last_checked < 0:   # happens when time_last_checked is initialized to 0 when checking for first time
-        time_last_checked = 0
-
-    # If-Modified-Since header: https://developer.mozilla.org/en-US/docs/Web/HTTP/Headers/If-Modified-Since
-    struct_time = time.gmtime(time_last_checked)
-    weekday = weekdays[struct_time.tm_wday]     # dumb requirement
-    month = months[struct_time.tm_mon - 1]
-    headers['If-Modified-Since'] = time.strftime(weekday + ', %d ' + month + ' %Y %H:%M:%S GMT', struct_time)
-    print(headers['If-Modified-Since'])
-
-
-    headers['User-Agent'] = 'Python-urllib'     # Don't leak python version
-    headers['Accept-Encoding'] = 'gzip, br'
-    req = urllib.request.Request(feed_url, headers=headers)
-    if settings.route_tor:
-        opener = urllib.request.build_opener(sockshandler.SocksiPyHandler(socks.PROXY_TYPE_SOCKS5, "127.0.0.1", 9150))
-    else:
-        opener = urllib.request.build_opener()
-    response = opener.open(req, timeout=15)
-
-
-    if response.getcode == '304':
-        print('No new videos for ' + channel_id)
-        return []
-
-
-    content = response.read()
-    print('Retrieved videos for ' + channel_id)
-    content = util.decode_content(content, response.getheader('Content-Encoding', default='identity'))
-
-
-    feed = atoma.parse_atom_bytes(content)
-    atom_videos = {}
-    for entry in feed.entries:
-        video_id = entry.id_[9:]     # example of id_: yt:video:q6EoRBvdVPQ
-
-        atom_videos[video_id] = {
-            'title': entry.title.value,
-            #'description': '',              # Not supported by atoma
-            #'duration': '',                 # Youtube's atom feeds don't provide it.. very frustrating
-            'time_published':   int(entry.published.timestamp()),
-        }
-
-
-    # final list
+def _get_upstream_videos(channel_id):
     videos = []
 
-    # Now check channel page to retrieve missing information for videos
     json_channel_videos = channel.get_grid_items(channel.get_channel_tab(channel_id)[1]['response'])
     for json_video in json_channel_videos:
         info = yt_data_extract.renderer_info(json_video['gridVideoRenderer'])
         if 'description' not in info:
             info['description'] = ''
-        if info['id'] in atom_videos:
-            info.update(atom_videos[info['id']])
-        else:
-            info['time_published'] = youtube_timestamp_to_posix(info['published'])
+        info['time_published'] = youtube_timestamp_to_posix(info['published'])
         videos.append(info)
     return videos
 
@@ -231,8 +168,8 @@ def post_subscriptions_page(env, start_response):
         connection = open_database()
         try:
             cursor = connection.cursor()
-            for uploader_id, channel_id, time_last_checked in cursor.execute('''SELECT id, channel_id, time_last_checked FROM subscribed_channels'''):
-                db_videos = ( (uploader_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(channel_id, time_last_checked) )
+            for uploader_id, channel_id in cursor.execute('''SELECT id, channel_id FROM subscribed_channels'''):
+                db_videos = ( (uploader_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(channel_id) )
                 cursor.executemany('''INSERT INTO videos (uploader_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
 
             cursor.execute('''UPDATE subscribed_channels SET time_last_checked = ?''', ( int(time.time()), ) )
-- 
cgit v1.2.3


From ccb795e31f2f9944b1c8b061906eb752009f8ea7 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 3 Jun 2019 03:20:44 -0700
Subject: Ensure videos in subscriptions from same channel in order

---
 youtube/subscriptions.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index a7b94bc..dc8412b 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -130,11 +130,11 @@ def _get_upstream_videos(channel_id):
     videos = []
 
     json_channel_videos = channel.get_grid_items(channel.get_channel_tab(channel_id)[1]['response'])
-    for json_video in json_channel_videos:
+    for i, json_video in enumerate(json_channel_videos):
         info = yt_data_extract.renderer_info(json_video['gridVideoRenderer'])
         if 'description' not in info:
             info['description'] = ''
-        info['time_published'] = youtube_timestamp_to_posix(info['published'])
+        info['time_published'] = youtube_timestamp_to_posix(info['published']) - i  # subtract a few seconds off the videos so they will be in the right order
         videos.append(info)
     return videos
 
-- 
cgit v1.2.3


From ae5fd9eb009c6522e7d7971e0bdea57faaaf2b3c Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Wed, 5 Jun 2019 00:41:15 -0700
Subject: Make thumbnails work and other stuff

---
 youtube/local_playlist.py | 30 ++-------------------------
 youtube/subscriptions.py  | 53 ++++++++++++++++++++++++++++++++++++++---------
 youtube/util.py           | 32 ++++++++++++++++++++++++++++
 youtube/youtube.py        |  2 +-
 4 files changed, 78 insertions(+), 39 deletions(-)

(limited to 'youtube')

diff --git a/youtube/local_playlist.py b/youtube/local_playlist.py
index e354013..d083e33 100644
--- a/youtube/local_playlist.py
+++ b/youtube/local_playlist.py
@@ -33,33 +33,7 @@ def add_to_playlist(name, video_info_list):
             if id not in ids:
                 file.write(info + "\n")
                 missing_thumbnails.append(id)
-    gevent.spawn(download_thumbnails, name, missing_thumbnails)
-
-def download_thumbnail(playlist_name, video_id):
-    url = "https://i.ytimg.com/vi/" + video_id + "/mqdefault.jpg"
-    save_location = os.path.join(thumbnails_directory, playlist_name, video_id + ".jpg")
-    try:
-        thumbnail = util.fetch_url(url, report_text="Saved local playlist thumbnail: " + video_id)
-    except urllib.error.HTTPError as e:
-        print("Failed to download thumbnail for " + video_id + ": " + str(e))
-        return
-    try:
-        f = open(save_location, 'wb')
-    except FileNotFoundError:
-        os.makedirs(os.path.join(thumbnails_directory, playlist_name))
-        f = open(save_location, 'wb')
-    f.write(thumbnail)
-    f.close()
-
-def download_thumbnails(playlist_name, ids):
-    # only do 5 at a time
-    # do the n where n is divisible by 5
-    i = -1
-    for i in range(0, int(len(ids)/5) - 1 ):
-        gevent.joinall([gevent.spawn(download_thumbnail, playlist_name, ids[j]) for j in range(i*5, i*5 + 5)])
-    # do the remainders (< 5)
-    gevent.joinall([gevent.spawn(download_thumbnail, playlist_name, ids[j]) for j in range(i*5 + 5, len(ids))])
-            
+    gevent.spawn(util.download_thumbnails, os.path.join(thumbnails_directory, name), missing_thumbnails)
         
 
 def get_local_playlist_page(name):
@@ -84,7 +58,7 @@ def get_local_playlist_page(name):
             videos_html += html_common.video_item_html(info, html_common.small_video_item_template)
         except json.decoder.JSONDecodeError:
             pass
-    gevent.spawn(download_thumbnails, name, missing_thumbnails)
+    gevent.spawn(util.download_thumbnails, os.path.join(thumbnails_directory, name), missing_thumbnails)
     return local_playlist_template.substitute(
         page_title = name + ' - Local playlist',
         header = html_common.get_header(),
diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index dc8412b..93d064d 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -3,16 +3,13 @@ import settings
 from string import Template
 import sqlite3
 import os
-import secrets
-import datetime
-import itertools
 import time
-import urllib
-import socks, sockshandler
+import gevent
 
 with open('yt_subscriptions_template.html', 'r', encoding='utf-8') as f:
     subscriptions_template = Template(f.read())
 
+thumbnails_directory = os.path.join(settings.data_dir, "subscription_thumbnails")
 
 # https://stackabuse.com/a-sqlite-tutorial-with-python/
 
@@ -28,14 +25,14 @@ def open_database():
         cursor = connection.cursor()
         cursor.execute('''CREATE TABLE IF NOT EXISTS subscribed_channels (
                               id integer PRIMARY KEY,
-                              channel_id text NOT NULL,
+                              channel_id text UNIQUE NOT NULL,
                               channel_name text NOT NULL,
                               time_last_checked integer
                           )''')
         cursor.execute('''CREATE TABLE IF NOT EXISTS videos (
                               id integer PRIMARY KEY,
                               uploader_id integer NOT NULL REFERENCES subscribed_channels(id) ON UPDATE CASCADE ON DELETE CASCADE,
-                              video_id text NOT NULL,
+                              video_id text UNIQUE NOT NULL,
                               title text NOT NULL,
                               duration text,
                               time_published integer NOT NULL,
@@ -58,7 +55,7 @@ def _subscribe(channels):
     connection = open_database()
     try:
         cursor = connection.cursor()
-        cursor.executemany("INSERT INTO subscribed_channels (channel_id, channel_name, time_last_checked) VALUES (?, ?, ?)", channels)
+        cursor.executemany("INSERT OR IGNORE INTO subscribed_channels (channel_id, channel_name, time_last_checked) VALUES (?, ?, ?)", channels)
         connection.commit()
     except:
         connection.rollback()
@@ -104,6 +101,10 @@ def _get_videos(number, offset):
 
 
+
+
+
+
 units = {
     'year': 31536000,   # 365*24*3600
     'month': 2592000,   # 30*24*3600
@@ -126,6 +127,16 @@ def youtube_timestamp_to_posix(dumb_timestamp):
         unit = unit[:-1]    # remove s from end
     return now - number*units[unit]
 
+# Use this to mark a thumbnail acceptable to be retrieved at the request of the browser
+downloading_thumbnails = set()
+def download_thumbnails(thumbnails_directory, thumbnails):
+    try:
+        g = gevent.spawn(util.download_thumbnails, thumbnails_directory, thumbnails)
+        g.join()
+    finally:
+        downloading_thumbnails.difference_update(thumbnails)
+
+
 def _get_upstream_videos(channel_id):
     videos = []
 
@@ -136,12 +147,34 @@ def _get_upstream_videos(channel_id):
             info['description'] = ''
         info['time_published'] = youtube_timestamp_to_posix(info['published']) - i  # subtract a few seconds off the videos so they will be in the right order
         videos.append(info)
+
+    try:
+        existing_thumbnails = set(os.path.splitext(name)[0] for name in os.listdir(thumbnails_directory))
+    except FileNotFoundError:
+        existing_thumbnails = set()
+    missing_thumbnails = set(video['id'] for video in videos) - existing_thumbnails
+    downloading_thumbnails.update(missing_thumbnails)
+    gevent.spawn(download_thumbnails, thumbnails_directory, missing_thumbnails)
+
     return videos
 
+
+
+
+
+
+
+
+
 def get_subscriptions_page(env, start_response):
     items_html = '''<nav class="item-grid">\n'''
 
     for item in _get_videos(30, 0):
+        print("Downloading_thumbnails: ", downloading_thumbnails)
+        if item['id'] in downloading_thumbnails:
+            item['thumbnail'] = util.get_thumbnail_url(item['id'])
+        else:
+            item['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + item['id'] + '.jpg'
         items_html += html_common.video_item_html(item, html_common.small_video_item_template)
     items_html += '''\n</nav>'''
 
@@ -168,9 +201,9 @@ def post_subscriptions_page(env, start_response):
         connection = open_database()
         try:
             cursor = connection.cursor()
-            for uploader_id, channel_id in cursor.execute('''SELECT id, channel_id FROM subscribed_channels'''):
+            for uploader_id, channel_id in cursor.execute('''SELECT id, channel_id FROM subscribed_channels''').fetchall():
                 db_videos = ( (uploader_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(channel_id) )
-                cursor.executemany('''INSERT INTO videos (uploader_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
+                cursor.executemany('''INSERT OR IGNORE INTO videos (uploader_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
 
             cursor.execute('''UPDATE subscribed_channels SET time_last_checked = ?''', ( int(time.time()), ) )
             connection.commit()
diff --git a/youtube/util.py b/youtube/util.py
index 9950815..42d76a3 100644
--- a/youtube/util.py
+++ b/youtube/util.py
@@ -5,6 +5,8 @@ import brotli
 import urllib.parse
 import re
 import time
+import os
+import gevent
 
 # The trouble with the requests library: It ships its own certificate bundle via certifi
 #  instead of using the system certificate store, meaning self-signed certificates
@@ -176,6 +178,36 @@ desktop_ua = (('User-Agent', desktop_user_agent),)
 
 
+def download_thumbnail(save_directory, video_id):
+    url = "https://i.ytimg.com/vi/" + video_id + "/mqdefault.jpg"
+    save_location = os.path.join(save_directory, video_id + ".jpg")
+    try:
+        thumbnail = fetch_url(url, report_text="Saved thumbnail: " + video_id)
+    except urllib.error.HTTPError as e:
+        print("Failed to download thumbnail for " + video_id + ": " + str(e))
+        return
+    try:
+        f = open(save_location, 'wb')
+    except FileNotFoundError:
+        os.makedirs(save_directory)
+        f = open(save_location, 'wb')
+    f.write(thumbnail)
+    f.close()
+
+def download_thumbnails(save_directory, ids):
+    if not isinstance(ids, (list, tuple)):
+        ids = list(ids)
+    # only do 5 at a time
+    # do the n where n is divisible by 5
+    i = -1
+    for i in range(0, int(len(ids)/5) - 1 ):
+        gevent.joinall([gevent.spawn(download_thumbnail, save_directory, ids[j]) for j in range(i*5, i*5 + 5)])
+    # do the remainders (< 5)
+    gevent.joinall([gevent.spawn(download_thumbnail, save_directory, ids[j]) for j in range(i*5 + 5, len(ids))])
+
+
+
+
 
 
 def dict_add(*dicts):
diff --git a/youtube/youtube.py b/youtube/youtube.py
index 4ec7962..c629bbb 100644
--- a/youtube/youtube.py
+++ b/youtube/youtube.py
@@ -61,7 +61,7 @@ def youtube(env, start_response):
                 start_response('200 OK',  (('Content-type',mime_type),) )
                 return f.read()
 
-        elif path.startswith("/data/playlist_thumbnails/"):
+        elif path.startswith('/data/playlist_thumbnails/') or path.startswith('/data/subscription_thumbnails/'):
             with open(os.path.join(settings.data_dir, os.path.normpath(path[6:])), 'rb') as f:
                 start_response('200 OK',  (('Content-type', "image/jpeg"),) )
                 return f.read()
-- 
cgit v1.2.3


From 60fe4b2e75e8475b20001c84e01b642a3b3ebcc3 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Fri, 7 Jun 2019 21:15:16 -0700
Subject: Add subscription manager system

---
 youtube/shared.css       |   5 +-
 youtube/subscriptions.py | 284 +++++++++++++++++++++++++++++++++++++++++++++--
 youtube/youtube.py       |  59 +++++++++-
 3 files changed, 334 insertions(+), 14 deletions(-)

(limited to 'youtube')

diff --git a/youtube/shared.css b/youtube/shared.css
index 1b25d7f..cd82164 100644
--- a/youtube/shared.css
+++ b/youtube/shared.css
@@ -1,7 +1,10 @@
+* {
+    box-sizing: border-box;
+}
+
 h1, h2, h3, h4, h5, h6, div, button{
     margin:0;
     padding:0;
-    
 }
 
 
diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 93d064d..4591f32 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -5,10 +5,17 @@ import sqlite3
 import os
 import time
 import gevent
+import html
+import json
+import traceback
 
 with open('yt_subscriptions_template.html', 'r', encoding='utf-8') as f:
     subscriptions_template = Template(f.read())
 
+with open('yt_subscription_manager_template.html', 'r', encoding='utf-8') as f:
+    subscription_manager_template = Template(f.read())
+
+
 thumbnails_directory = os.path.join(settings.data_dir, "subscription_thumbnails")
 
 # https://stackabuse.com/a-sqlite-tutorial-with-python/
@@ -25,19 +32,26 @@ def open_database():
         cursor = connection.cursor()
         cursor.execute('''CREATE TABLE IF NOT EXISTS subscribed_channels (
                               id integer PRIMARY KEY,
-                              channel_id text UNIQUE NOT NULL,
+                              yt_channel_id text UNIQUE NOT NULL,
                               channel_name text NOT NULL,
                               time_last_checked integer
                           )''')
         cursor.execute('''CREATE TABLE IF NOT EXISTS videos (
                               id integer PRIMARY KEY,
-                              uploader_id integer NOT NULL REFERENCES subscribed_channels(id) ON UPDATE CASCADE ON DELETE CASCADE,
+                              sql_channel_id integer NOT NULL REFERENCES subscribed_channels(id) ON UPDATE CASCADE ON DELETE CASCADE,
                               video_id text UNIQUE NOT NULL,
                               title text NOT NULL,
                               duration text,
                               time_published integer NOT NULL,
                               description text
                           )''')
+        cursor.execute('''CREATE TABLE IF NOT EXISTS tag_associations (
+                              id integer PRIMARY KEY,
+                              tag text NOT NULL,
+                              sql_channel_id integer NOT NULL REFERENCES subscribed_channels(id) ON UPDATE CASCADE ON DELETE CASCADE,
+                              UNIQUE(tag, sql_channel_id)
+                          )''')
+
         connection.commit()
     except:
         connection.rollback()
@@ -55,7 +69,7 @@ def _subscribe(channels):
     connection = open_database()
     try:
         cursor = connection.cursor()
-        cursor.executemany("INSERT OR IGNORE INTO subscribed_channels (channel_id, channel_name, time_last_checked) VALUES (?, ?, ?)", channels)
+        cursor.executemany("INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked) VALUES (?, ?, ?)", channels)
         connection.commit()
     except:
         connection.rollback()
@@ -63,12 +77,13 @@ def _subscribe(channels):
     finally:
         connection.close()
 
+# TODO: delete thumbnails
 def _unsubscribe(channel_ids):
     ''' channel_ids is a list of channel_ids '''
     connection = open_database()
     try:
         cursor = connection.cursor()
-        cursor.executemany("DELETE FROM subscribed_channels WHERE channel_id=?", ((channel_id, ) for channel_id in channel_ids))
+        cursor.executemany("DELETE FROM subscribed_channels WHERE yt_channel_id=?", ((channel_id, ) for channel_id in channel_ids))
         connection.commit()
     except:
         connection.rollback()
@@ -82,7 +97,7 @@ def _get_videos(number, offset):
         cursor = connection.cursor()
         db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
                           FROM videos
-                          INNER JOIN subscribed_channels on videos.uploader_id = subscribed_channels.id
+                          INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
                           ORDER BY time_published DESC
                           LIMIT ? OFFSET ?''', (number, offset))
 
@@ -99,10 +114,98 @@ def _get_videos(number, offset):
     finally:
         connection.close()
 
+def _get_subscribed_channels():
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
+        for item in cursor.execute('''SELECT channel_name, yt_channel_id
+                                      FROM subscribed_channels
+                                      ORDER BY channel_name'''):
+            yield item
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
+
+def _add_tags(channel_ids, tags):
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
+
+        pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
+
+        cursor.executemany('''INSERT OR IGNORE INTO tag_associations (tag, sql_channel_id)
+                              SELECT ?, id FROM subscribed_channels WHERE yt_channel_id = ? ''', pairs)
+        connection.commit()
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
+
+
+
+def _remove_tags(channel_ids, tags):
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
+
+        pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
 
+        cursor.executemany('''DELETE FROM tag_associations WHERE tag = ? AND sql_channel_id = (
+                                          SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
+                                      )''', pairs)
+        connection.commit()
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
 
 
+def _get_tags(channel_id):
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
 
+        return [row[0] for row in cursor.execute('''SELECT tag
+                                      FROM tag_associations
+                                      WHERE sql_channel_id = (
+                                          SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
+                                      )''', (channel_id,))]
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
+
+def _get_all_tags():
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
+        return [row[0] for row in cursor.execute('''SELECT DISTINCT tag FROM tag_associations''')]
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
+
+def _get_channel_names(channel_ids):
+    ''' returns list of (channel_id, channel_name) '''
+    connection = open_database()
+    try:
+        cursor = connection.cursor()
+        result = []
+        for channel_id in channel_ids:
+            row = cursor.execute('''SELECT channel_name FROM subscribed_channels WHERE yt_channel_id = ?''', (channel_id,)).fetchone()
+            result.append( (channel_id, row[0]) )
+        return result
+    except:
+        connection.rollback()
+        raise
+    finally:
+        connection.close()
 
 
 units = {
@@ -166,11 +269,156 @@ def _get_upstream_videos(channel_id):
 
 
+def import_subscriptions(env, start_response):
+    content_type = env['parameters']['subscriptions_file'][0]
+    file = env['parameters']['subscriptions_file'][1]
+
+    file = file.decode('utf-8')
+
+    if content_type == 'application/json':
+        try:
+            file = json.loads(file)
+        except json.decoder.JSONDecodeError:
+            traceback.print_exc()
+            start_response('400 Bad Request', () )
+            return b'400 Bad Request: Invalid json file'
+
+        try:
+            channels = ( (item['snippet']['resourceId']['channelId'], item['snippet']['title']) for item in file)
+        except (KeyError, IndexError):
+            traceback.print_exc()
+            start_response('400 Bad Request', () )
+            return b'400 Bad Request: Unknown json structure'
+    else:
+        raise NotImplementedError()
+
+    _subscribe(channels)
+
+    start_response('303 See Other', [('Location', util.URL_ORIGIN + '/subscription_manager'),] )
+    return b''
+
+
+
+sub_list_item_template = Template('''
+<li>
+    <a href="$channel_url" class="sub-list-item-name" title="$channel_name">$channel_name</a>
+    <span class="tag-list">$tags</span>
+    <input class="sub-list-checkbox" name="channel_ids" value="$channel_id" form="subscription-manager-form" type="checkbox">
+</li>''')
+
+def get_subscription_manager_page(env, start_response):
+
+    sub_list_html = ''
+    for channel_name, channel_id in _get_subscribed_channels():
+        sub_list_html += sub_list_item_template.substitute(
+            channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+            channel_name = html.escape(channel_name),
+            channel_id = channel_id,
+            tags = ', '.join(_get_tags(channel_id)),
+        )
+
+
+
+    start_response('200 OK', [('Content-type','text/html'),])
+    return subscription_manager_template.substitute(
+        header = html_common.get_header(),
+        sub_list = sub_list_html,
+        page_buttons = '',
+    ).encode('utf-8')
+
+def list_from_comma_separated_tags(string):
+    tags = []
+    prev_comma = -1
+    next_comma = string.find(',')
+    while next_comma != -1:
+        tag = string[prev_comma+1:next_comma].strip()
+        if tag:
+            tags.append(tag)
+
+        prev_comma = next_comma
+        next_comma = string.find(',', prev_comma+1)
+
+    last_tag = string[prev_comma+1:].strip()
+    if last_tag:
+        tags.append(last_tag)
+    return tags
+
+
+unsubscribe_list_item_template = Template('''
+<li><a href="$channel_url" title="$channel_name">$channel_name</a></li>''')
+def post_subscription_manager_page(env, start_response):
+    params = env['parameters']
+    action = params['action'][0]
+
+    if action == 'add_tags':
+        _add_tags(params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
+    elif action == 'remove_tags':
+        _remove_tags(params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
+    elif action == 'unsubscribe':
+        _unsubscribe(params['channel_ids'])
+    elif action == 'unsubscribe_verify':
+        page = '''
+        <span>Are you sure you want to unsubscribe from these channels?</span>
+        <form class="subscriptions-import-form" action="/youtube.com/subscription_manager" method="POST">'''
+
+        for channel_id in params['channel_ids']:
+            page += '<input type="hidden" name="channel_ids" value="' + channel_id + '">\n'
+
+        page += '''
+            <input type="hidden" name="action" value="unsubscribe">
+            <input type="submit" value="Yes, unsubscribe">
+        </form>
+        <ul>'''
+        for channel_id, channel_name in _get_channel_names(params['channel_ids']):
+            page += unsubscribe_list_item_template.substitute(
+                channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+                channel_name = html.escape(channel_name),
+            )
+        page += '''</ul>'''
+
+        start_response('200 OK', [('Content-type','text/html'),])
+        return html_common.yt_basic_template.substitute(
+            page_title = 'Unsubscribe?',
+            style = '',
+            header = html_common.get_header(),
+            page = page,
+        ).encode('utf-8')
+    else:
+        start_response('400 Bad Request', ())
+        return b'400 Bad Request'
+
+    start_response('303 See Other', [('Location', util.URL_ORIGIN + '/subscription_manager'),] )
+    return b''
+
+
+
+sidebar_tag_item_template = Template('''
+<li>
+    <span class="sidebar-item-name">$tag_name</span>
+    <form method="POST" class="sidebar-item-refresh">
+        <input type="submit" value="Check">
+        <input type="hidden" name="action" value="refresh">
+        <input type="hidden" name="type" value="tag">
+        <input type="hidden" name="tag_name" value="$tag_name">
+    </form>
+</li>''')
+
+
+sidebar_channel_item_template = Template('''
+<li>
+    <a href="$channel_url" class="sidebar-item-name" title="$channel_name">$channel_name</a>
+    <form method="POST" class="sidebar-item-refresh">
+        <input type="submit" value="Check">
+        <input type="hidden" name="action" value="refresh">
+        <input type="hidden" name="type" value="channel">
+        <input type="hidden" name="channel_id" value="$channel_id">
+    </form>
+</li>''')
+
 def get_subscriptions_page(env, start_response):
     items_html = '''<nav class="item-grid">\n'''
 
     for item in _get_videos(30, 0):
-        print("Downloading_thumbnails: ", downloading_thumbnails)
         if item['id'] in downloading_thumbnails:
             item['thumbnail'] = util.get_thumbnail_url(item['id'])
         else:
@@ -178,10 +426,28 @@ def get_subscriptions_page(env, start_response):
         items_html += html_common.video_item_html(item, html_common.small_video_item_template)
     items_html += '''\n</nav>'''
 
+
+    tag_list_html = ''
+    for tag_name in _get_all_tags():
+        tag_list_html += sidebar_tag_item_template.substitute(tag_name = tag_name)
+
+
+    sub_list_html = ''
+    for channel_name, channel_id in _get_subscribed_channels():
+        sub_list_html += sidebar_channel_item_template.substitute(
+            channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+            channel_name = html.escape(channel_name),
+            channel_id = channel_id,
+        )
+
+
+
     start_response('200 OK', [('Content-type','text/html'),])
     return subscriptions_template.substitute(
         header = html_common.get_header(),
         items = items_html,
+        tags = tag_list_html,
+        sub_list = sub_list_html,
         page_buttons = '',
     ).encode('utf-8')
 
@@ -201,9 +467,9 @@ def post_subscriptions_page(env, start_response):
         connection = open_database()
         try:
             cursor = connection.cursor()
-            for uploader_id, channel_id in cursor.execute('''SELECT id, channel_id FROM subscribed_channels''').fetchall():
-                db_videos = ( (uploader_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(channel_id) )
-                cursor.executemany('''INSERT OR IGNORE INTO videos (uploader_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
+            for sql_channel_id, yt_channel_id in cursor.execute('''SELECT id, yt_channel_id FROM subscribed_channels''').fetchall():
+                db_videos = ( (sql_channel_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(yt_channel_id) )
+                cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
 
             cursor.execute('''UPDATE subscribed_channels SET time_last_checked = ?''', ( int(time.time()), ) )
             connection.commit()
diff --git a/youtube/youtube.py b/youtube/youtube.py
index c629bbb..c0be4fe 100644
--- a/youtube/youtube.py
+++ b/youtube/youtube.py
@@ -1,6 +1,7 @@
 import mimetypes
 import urllib.parse
 import os
+import re
 from youtube import local_playlist, watch, search, playlist, channel, comments, post_comment, accounts, util, subscriptions
 import settings
 YOUTUBE_FILES = (
@@ -25,7 +26,8 @@ get_handlers = {
     'delete_comment':   post_comment.get_delete_comment_page,
     'login':            accounts.get_account_login_page,
 
-    'subscriptions':    subscriptions.get_subscriptions_page,
+    'subscriptions':            subscriptions.get_subscriptions_page,
+    'subscription_manager':     subscriptions.get_subscription_manager_page,
 }
 post_handlers = {
     'edit_playlist':    local_playlist.edit_playlist,
@@ -37,6 +39,8 @@ post_handlers = {
     'delete_comment':   post_comment.delete_comment,
 
     'subscriptions':    subscriptions.post_subscriptions_page,
+    'subscription_manager':     subscriptions.post_subscription_manager_page,
+    'import_subscriptions':     subscriptions.import_subscriptions,
 }
 
 def youtube(env, start_response):
@@ -90,9 +94,56 @@ def youtube(env, start_response):
             return channel.get_channel_page_general_url(env, start_response)
 
     elif method == "POST":
-        post_parameters = urllib.parse.parse_qs(env['wsgi.input'].read().decode())
-        env['post_parameters'] = post_parameters
-        env['parameters'].update(post_parameters)
+        content_type = env['CONTENT_TYPE']
+        if content_type == 'application/x-www-form-urlencoded':
+            post_parameters = urllib.parse.parse_qs(env['wsgi.input'].read().decode())
+            env['post_parameters'] = post_parameters
+            env['parameters'].update(post_parameters)
+
+        # Ugly hack that will be removed once I clean up this trainwreck and switch to a microframework
+        # Only supports a single file with no other fields
+        elif content_type.startswith('multipart/form-data'):
+            content = env['wsgi.input'].read()
+
+            # find double line break
+            file_start = content.find(b'\r\n\r\n')
+            if file_start == -1:
+                start_response('400 Bad Request', ())
+                return b'400 Bad Request'
+
+            file_start += 4
+
+            lines = content[0:file_start].splitlines()
+            boundary = lines[0]
+
+            file_end = content.find(boundary, file_start)
+            if file_end == -1:
+                start_response('400 Bad Request', ())
+                return b'400 Bad Request'
+            file_end -= 2  # Subtract newlines
+            file = content[file_start:file_end]
+
+            properties = dict()
+            for line in lines[1:]:
+                line = line.decode('utf-8')
+                colon = line.find(':')
+                if colon == -1:
+                    continue
+                properties[line[0:colon]] = line[colon+2:]
+
+            mime_type = properties['Content-Type']
+            field_name = re.search(r'name="([^"]*)"' , properties['Content-Disposition'])
+            if field_name is None:
+                start_response('400 Bad Request', ())
+                return b'400 Bad Request'
+            field_name = field_name.group(1)
+
+            env['post_parameters'] = {field_name: (mime_type, file)}
+            env['parameters'][field_name] = (mime_type, file)
+
+        else:
+            start_response('400 Bad Request', ())
+            return b'400 Bad Request'
 
         try:
             handler = post_handlers[path_parts[0]]
-- 
cgit v1.2.3


From c8be729e6ba706654849ed39e6238aebf85f1f36 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 8 Jun 2019 02:32:13 -0700
Subject: Reduce boilerplate in db functions with context managers

---
 youtube/subscriptions.py | 203 ++++++++++++++++-------------------------------
 1 file changed, 70 insertions(+), 133 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 4591f32..a3af40f 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -8,6 +8,7 @@ import gevent
 import html
 import json
 import traceback
+import contextlib
 
 with open('yt_subscriptions_template.html', 'r', encoding='utf-8') as f:
     subscriptions_template = Template(f.read())
@@ -58,7 +59,8 @@ def open_database():
         connection.close()
         raise
 
-    return connection
+    # https://stackoverflow.com/questions/19522505/using-sqlite3-in-python-with-with-keyword
+    return contextlib.closing(connection)
 
 def _subscribe(channels):
     ''' channels is a list of (channel_id, channel_name) '''
@@ -66,146 +68,88 @@ def _subscribe(channels):
     # set time_last_checked to 0 on all channels being subscribed to
     channels = ( (channel_id, channel_name, 0) for channel_id, channel_name in channels)
 
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
-        cursor.executemany("INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked) VALUES (?, ?, ?)", channels)
-        connection.commit()
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
+    with open_database() as connection:
+        with connection as cursor:
+            cursor.executemany('''INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked)
+                                  VALUES (?, ?, ?)''', channels)
 
 # TODO: delete thumbnails
 def _unsubscribe(channel_ids):
     ''' channel_ids is a list of channel_ids '''
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
-        cursor.executemany("DELETE FROM subscribed_channels WHERE yt_channel_id=?", ((channel_id, ) for channel_id in channel_ids))
-        connection.commit()
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
+    with open_database() as connection:
+        with connection as cursor:
+            cursor.executemany("DELETE FROM subscribed_channels WHERE yt_channel_id=?", ((channel_id, ) for channel_id in channel_ids))
 
 def _get_videos(number, offset):
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
-        db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
-                          FROM videos
-                          INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
-                          ORDER BY time_published DESC
-                          LIMIT ? OFFSET ?''', (number, offset))
-
-        for db_video in db_videos:
-            yield {
-                'id':   db_video[0],
-                'title':    db_video[1],
-                'duration': db_video[2],
-                'author':   db_video[3],
-            }
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
+    with open_database() as connection:
+        with connection as cursor:
+            db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
+                                          FROM videos
+                                          INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
+                                          ORDER BY time_published DESC
+                                          LIMIT ? OFFSET ?''', (number, offset))
+
+            for db_video in db_videos:
+                yield {
+                    'id':   db_video[0],
+                    'title':    db_video[1],
+                    'duration': db_video[2],
+                    'author':   db_video[3],
+                }
 
 def _get_subscribed_channels():
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
-        for item in cursor.execute('''SELECT channel_name, yt_channel_id
-                                      FROM subscribed_channels
-                                      ORDER BY channel_name'''):
-            yield item
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
-
-def _add_tags(channel_ids, tags):
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
+    with open_database() as connection:
+        with connection as cursor:
+            for item in cursor.execute('''SELECT channel_name, yt_channel_id
+                                          FROM subscribed_channels
+                                          ORDER BY channel_name'''):
+                yield item
 
-        pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
-
-        cursor.executemany('''INSERT OR IGNORE INTO tag_associations (tag, sql_channel_id)
-                              SELECT ?, id FROM subscribed_channels WHERE yt_channel_id = ? ''', pairs)
-        connection.commit()
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
 
+def _add_tags(channel_ids, tags):
+    with open_database() as connection:
+        with connection as cursor:
+            pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
+            cursor.executemany('''INSERT OR IGNORE INTO tag_associations (tag, sql_channel_id)
+                                  SELECT ?, id FROM subscribed_channels WHERE yt_channel_id = ? ''', pairs)
 
 
 def _remove_tags(channel_ids, tags):
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
+    with open_database() as connection:
+        with connection as cursor:
+            pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
+            cursor.executemany('''DELETE FROM tag_associations
+                                  WHERE tag = ? AND sql_channel_id = (
+                                      SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
+                                   )''', pairs)
 
-        pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
-
-        cursor.executemany('''DELETE FROM tag_associations WHERE tag = ? AND sql_channel_id = (
-                                          SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
-                                      )''', pairs)
-        connection.commit()
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
 
 
 def _get_tags(channel_id):
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
-
-        return [row[0] for row in cursor.execute('''SELECT tag
-                                      FROM tag_associations
-                                      WHERE sql_channel_id = (
-                                          SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
-                                      )''', (channel_id,))]
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
+    with open_database() as connection:
+        with connection as cursor:
+            return [row[0] for row in cursor.execute('''SELECT tag
+                                                        FROM tag_associations
+                                                        WHERE sql_channel_id = (
+                                                            SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
+                                                        )''', (channel_id,))]
 
 def _get_all_tags():
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
-        return [row[0] for row in cursor.execute('''SELECT DISTINCT tag FROM tag_associations''')]
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
+    with open_database() as connection:
+        with connection as cursor:
+            return [row[0] for row in cursor.execute('''SELECT DISTINCT tag FROM tag_associations''')]
 
 def _get_channel_names(channel_ids):
     ''' returns list of (channel_id, channel_name) '''
-    connection = open_database()
-    try:
-        cursor = connection.cursor()
-        result = []
-        for channel_id in channel_ids:
-            row = cursor.execute('''SELECT channel_name FROM subscribed_channels WHERE yt_channel_id = ?''', (channel_id,)).fetchone()
-            result.append( (channel_id, row[0]) )
-        return result
-    except:
-        connection.rollback()
-        raise
-    finally:
-        connection.close()
+    with open_database() as connection:
+        with connection as cursor:
+            result = []
+            for channel_id in channel_ids:
+                row = cursor.execute('''SELECT channel_name
+                                        FROM subscribed_channels
+                                        WHERE yt_channel_id = ?''', (channel_id,)).fetchone()
+                result.append( (channel_id, row[0]) )
+            return result
 
 
 units = {
@@ -464,20 +408,13 @@ def post_subscriptions_page(env, start_response):
         _unsubscribe(params['channel_id'])
 
     elif action == 'refresh':
-        connection = open_database()
-        try:
-            cursor = connection.cursor()
-            for sql_channel_id, yt_channel_id in cursor.execute('''SELECT id, yt_channel_id FROM subscribed_channels''').fetchall():
-                db_videos = ( (sql_channel_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(yt_channel_id) )
-                cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
-
-            cursor.execute('''UPDATE subscribed_channels SET time_last_checked = ?''', ( int(time.time()), ) )
-            connection.commit()
-        except:
-            connection.rollback()
-            raise
-        finally:
-            connection.close()
+        with open_database() as connection:
+            with connection as cursor:
+                for sql_channel_id, yt_channel_id in cursor.execute('''SELECT id, yt_channel_id FROM subscribed_channels''').fetchall():
+                    db_videos = ( (sql_channel_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(yt_channel_id) )
+                    cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
+
+                cursor.execute('''UPDATE subscribed_channels SET time_last_checked = ?''', ( int(time.time()), ) )
 
         start_response('303 See Other', [('Location', util.URL_ORIGIN + '/subscriptions'),] )
         return b''
-- 
cgit v1.2.3


From f5c76462d722d45645029754b4fc85252cf8212e Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 8 Jun 2019 02:35:21 -0700
Subject: Don't spam database with opening and closing when getting tags for
 many channels

---
 youtube/subscriptions.py | 30 +++++++++++++++---------------
 1 file changed, 15 insertions(+), 15 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index a3af40f..ff74d94 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -125,14 +125,12 @@ def _remove_tags(channel_ids, tags):
 
 
-def _get_tags(channel_id):
-    with open_database() as connection:
-        with connection as cursor:
-            return [row[0] for row in cursor.execute('''SELECT tag
-                                                        FROM tag_associations
-                                                        WHERE sql_channel_id = (
-                                                            SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
-                                                        )''', (channel_id,))]
+def _get_tags(cursor, channel_id):
+    return [row[0] for row in cursor.execute('''SELECT tag
+                                                FROM tag_associations
+                                                WHERE sql_channel_id = (
+                                                    SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
+                                                )''', (channel_id,))]
 
 def _get_all_tags():
     with open_database() as connection:
@@ -253,13 +251,15 @@ sub_list_item_template = Template('''
 def get_subscription_manager_page(env, start_response):
 
     sub_list_html = ''
-    for channel_name, channel_id in _get_subscribed_channels():
-        sub_list_html += sub_list_item_template.substitute(
-            channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-            channel_name = html.escape(channel_name),
-            channel_id = channel_id,
-            tags = ', '.join(_get_tags(channel_id)),
-        )
+    with open_database() as connection:
+        with connection as cursor:
+            for channel_name, channel_id in _get_subscribed_channels():
+                sub_list_html += sub_list_item_template.substitute(
+                    channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+                    channel_name = html.escape(channel_name),
+                    channel_id = channel_id,
+                    tags = ', '.join(_get_tags(cursor, channel_id)),
+                )
 
 
-- 
cgit v1.2.3


From 27ee2990e97b1e73df41c1512332a1facd56f759 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 9 Jun 2019 16:03:20 -0700
Subject: Overhaul refresh system, make it asynchronous

---
 youtube/subscriptions.py | 144 +++++++++++++++++++++++++++++++++++++++--------
 youtube/util.py          |  54 +++++++++++++++++-
 2 files changed, 171 insertions(+), 27 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index ff74d94..ba27655 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -26,7 +26,7 @@ database_path = os.path.join(settings.data_dir, "subscriptions.sqlite")
 def open_database():
     if not os.path.exists(settings.data_dir):
         os.makedirs(settings.data_dir)
-    connection = sqlite3.connect(database_path)
+    connection = sqlite3.connect(database_path, check_same_thread=False)
 
     # Create tables if they don't exist
     try:
@@ -172,17 +172,75 @@ def youtube_timestamp_to_posix(dumb_timestamp):
         unit = unit[:-1]    # remove s from end
     return now - number*units[unit]
 
+
+try:
+    existing_thumbnails = set(os.path.splitext(name)[0] for name in os.listdir(thumbnails_directory))
+except FileNotFoundError:
+    existing_thumbnails = set()
+
+
+thumbnails_queue = util.RateLimitedQueue()
+check_channels_queue = util.RateLimitedQueue()
+
+
 # Use this to mark a thumbnail acceptable to be retrieved at the request of the browser
+# can't simply check if it's in the queue because items are removed when the download starts, not when it finishes
 downloading_thumbnails = set()
-def download_thumbnails(thumbnails_directory, thumbnails):
-    try:
-        g = gevent.spawn(util.download_thumbnails, thumbnails_directory, thumbnails)
-        g.join()
-    finally:
-        downloading_thumbnails.difference_update(thumbnails)
+
+checking_channels = set()
+
+# Just to use for printing channel checking status to console without opening database
+channel_names = dict()
+
+def download_thumbnail_worker():
+    while True:
+        video_id = thumbnails_queue.get()
+        try:
+            success = util.download_thumbnail(thumbnails_directory, video_id)
+            if success:
+                existing_thumbnails.add(video_id)
+        except Exception:
+            traceback.print_exc()
+        finally:
+            downloading_thumbnails.remove(video_id)
+
+def check_channel_worker():
+    ''' Runs forever: takes channel ids off check_channels_queue and checks each one for new videos '''
+    while True:
+        channel_id = check_channels_queue.get()
+        try:
+            _get_upstream_videos(channel_id)
+        except Exception:
+            # Log and keep going: an uncaught error would end this greenlet, and once all 5 workers died nothing would drain the queue
+            traceback.print_exc()
+        finally:
+            checking_channels.remove(channel_id)
+
+for i in range(0,5):
+    gevent.spawn(download_thumbnail_worker)
+    gevent.spawn(check_channel_worker)
+
+
+def download_thumbnails_if_necessary(thumbnails):
+    for video_id in thumbnails:
+        if video_id not in existing_thumbnails and video_id not in downloading_thumbnails:
+            downloading_thumbnails.add(video_id)
+            thumbnails_queue.put(video_id)
+
+def check_channels_if_necessary(channel_ids):
+    for channel_id in channel_ids:
+        if channel_id not in checking_channels:
+            checking_channels.add(channel_id)
+            check_channels_queue.put(channel_id)
+
 
 
 def _get_upstream_videos(channel_id):
+    try:
+        print("Checking channel: " + channel_names[channel_id])
+    except KeyError:
+        print("Checking channel " + channel_id)
+
     videos = []
 
     json_channel_videos = channel.get_grid_items(channel.get_channel_tab(channel_id)[1]['response'])
@@ -190,23 +248,56 @@ def _get_upstream_videos(channel_id):
         info = yt_data_extract.renderer_info(json_video['gridVideoRenderer'])
         if 'description' not in info:
             info['description'] = ''
-        info['time_published'] = youtube_timestamp_to_posix(info['published']) - i  # subtract a few seconds off the videos so they will be in the right order
-        videos.append(info)
+        try:
+            info['time_published'] = youtube_timestamp_to_posix(info['published']) - i  # subtract a few seconds off the videos so they will be in the right order
+        except KeyError:
+            print(info)
+        videos.append((channel_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']))
+
+    now = time.time()
+    download_thumbnails_if_necessary(video[1] for video in videos if (now - video[4]) < 30*24*3600) # Don't download thumbnails from videos older than a month
+
+    with open_database() as connection:
+        with connection as cursor:
+            cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, description)
+                                  VALUES ((SELECT id FROM subscribed_channels WHERE yt_channel_id=?), ?, ?, ?, ?, ?)''', videos)
+            cursor.execute('''UPDATE subscribed_channels
+                              SET time_last_checked = ?
+                              WHERE yt_channel_id=?''', [int(time.time()), channel_id])
 
-    try:
-        existing_thumbnails = set(os.path.splitext(name)[0] for name in os.listdir(thumbnails_directory))
-    except FileNotFoundError:
-        existing_thumbnails = set()
-    missing_thumbnails = set(video['id'] for video in videos) - existing_thumbnails
-    downloading_thumbnails.update(missing_thumbnails)
-    gevent.spawn(download_thumbnails, thumbnails_directory, missing_thumbnails)
 
-    return videos
+def check_all_channels():
+    with open_database() as connection:
+        with connection as cursor:
+            channel_id_name_list = cursor.execute('''SELECT yt_channel_id, channel_name FROM subscribed_channels''').fetchall()
 
+    channel_names.update(channel_id_name_list)
+    check_channels_if_necessary([item[0] for item in channel_id_name_list])
 
 
+def check_tags(tags):
+    channel_id_name_list = []
+    with open_database() as connection:
+        with connection as cursor:
+            for tag in tags:
+                channel_id_name_list += cursor.execute('''SELECT yt_channel_id, channel_name
+                                                          FROM subscribed_channels
+                                                          WHERE subscribed_channels.id IN (
+                                                              SELECT tag_associations.sql_channel_id FROM tag_associations WHERE tag=?
+                                                          )''', [tag]).fetchall()
+    channel_names.update(channel_id_name_list)
+    check_channels_if_necessary([item[0] for item in channel_id_name_list])
 
 
+def check_specific_channels(channel_ids):
+    ''' Looks up the names of the given channel ids (used for console status output) and queues the channels for checking '''
+    channel_id_name_list = []   # must start empty; it was previously used with += without ever being assigned
+    with open_database() as connection:
+        with connection as cursor:
+            for channel_id in channel_ids:
+                channel_id_name_list += cursor.execute('''SELECT yt_channel_id, channel_name FROM subscribed_channels WHERE yt_channel_id=?''', [channel_id]).fetchall()
+    channel_names.update(channel_id_name_list)
+    check_channels_if_necessary(channel_ids)
 
 
@@ -408,15 +499,18 @@ def post_subscriptions_page(env, start_response):
         _unsubscribe(params['channel_id'])
 
     elif action == 'refresh':
-        with open_database() as connection:
-            with connection as cursor:
-                for sql_channel_id, yt_channel_id in cursor.execute('''SELECT id, yt_channel_id FROM subscribed_channels''').fetchall():
-                    db_videos = ( (sql_channel_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']) for info in _get_upstream_videos(yt_channel_id) )
-                    cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, description) VALUES (?, ?, ?, ?, ?, ?)''', db_videos)
-
-                cursor.execute('''UPDATE subscribed_channels SET time_last_checked = ?''', ( int(time.time()), ) )
+        type = params['type'][0]
+        if type == 'all':
+            check_all_channels()
+        elif type == 'tag':
+            check_tags(params['tag_name'])
+        elif type == 'channel':
+            check_specific_channels(params['channel_id'])
+        else:
+            start_response('400 Bad Request', ())
+            return b'400 Bad Request'
 
-        start_response('303 See Other', [('Location', util.URL_ORIGIN + '/subscriptions'),] )
+        start_response('204 No Content', ())
         return b''
     else:
         start_response('400 Bad Request', ())
diff --git a/youtube/util.py b/youtube/util.py
index 42d76a3..c4e1aff 100644
--- a/youtube/util.py
+++ b/youtube/util.py
@@ -7,6 +7,8 @@ import re
 import time
 import os
 import gevent
+import gevent.queue
+import gevent.lock
 
 # The trouble with the requests library: It ships its own certificate bundle via certifi
 #  instead of using the system certificate store, meaning self-signed certificates
@@ -176,6 +178,53 @@ desktop_ua = (('User-Agent', desktop_user_agent),)
 
 
+class RateLimitedQueue(gevent.queue.Queue):
+    ''' Does initial_burst (def. 30) at first, then alternates between waiting waiting_period (def. 5) seconds and doing subsequent_bursts (def. 10) queries. After waiting_period seconds with nothing left in the queue, resets rate limiting. '''
+
+    def __init__(self, initial_burst=30, waiting_period=5, subsequent_bursts=10):
+        self.initial_burst = initial_burst
+        self.waiting_period = waiting_period
+        self.subsequent_bursts = subsequent_bursts
+
+        self.count_since_last_wait = 0
+        self.surpassed_initial = False
+
+        self.lock = gevent.lock.BoundedSemaphore(1)
+        self.currently_empty = False
+        self.empty_start = 0
+        gevent.queue.Queue.__init__(self)
+
+
+    def get(self):
+        ''' Returns the next item, first sleeping waiting_period seconds whenever the current burst allowance is used up '''
+        # "with" guarantees the lock is released even if this greenlet is killed or raises while sleeping or waiting for an item
+        with self.lock:     # blocks if another greenlet currently has the lock
+            if self.count_since_last_wait >= self.subsequent_bursts and self.surpassed_initial:
+                gevent.sleep(self.waiting_period)
+                self.count_since_last_wait = 0
+
+            elif self.count_since_last_wait >= self.initial_burst and not self.surpassed_initial:
+                self.surpassed_initial = True
+                gevent.sleep(self.waiting_period)
+                self.count_since_last_wait = 0
+
+            self.count_since_last_wait += 1
+
+            if not self.currently_empty and self.empty():
+                self.currently_empty = True
+                self.empty_start = time.monotonic()
+
+            item = gevent.queue.Queue.get(self)     # blocks when nothing left
+
+            if self.currently_empty:
+                if time.monotonic() - self.empty_start >= self.waiting_period:
+                    self.count_since_last_wait = 0
+                    self.surpassed_initial = False
+
+                self.currently_empty = False
+
+            return item
+
 
 
 def download_thumbnail(save_directory, video_id):
@@ -185,14 +234,15 @@ def download_thumbnail(save_directory, video_id):
         thumbnail = fetch_url(url, report_text="Saved thumbnail: " + video_id)
     except urllib.error.HTTPError as e:
         print("Failed to download thumbnail for " + video_id + ": " + str(e))
-        return
+        return False
     try:
         f = open(save_location, 'wb')
     except FileNotFoundError:
-        os.makedirs(save_directory)
+        os.makedirs(save_directory, exist_ok = True)
         f = open(save_location, 'wb')
     f.write(thumbnail)
     f.close()
+    return True
 
 def download_thumbnails(save_directory, ids):
     if not isinstance(ids, (list, tuple)):
-- 
cgit v1.2.3


From 83f3dfaff54e27f59153980466685e77c4bf12cb Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 9 Jun 2019 18:01:46 -0700
Subject: simplify list_from_comma_separated_tags

---
 youtube/subscriptions.py | 16 +---------------
 1 file changed, 1 insertion(+), 15 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index ba27655..be4ea1d 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -362,21 +362,7 @@ def get_subscription_manager_page(env, start_response):
     ).encode('utf-8')
 
 def list_from_comma_separated_tags(string):
-    tags = []
-    prev_comma = -1
-    next_comma = string.find(',')
-    while next_comma != -1:
-        tag = string[prev_comma+1:next_comma].strip()
-        if tag:
-            tags.append(tag)
-
-        prev_comma = next_comma
-        next_comma = string.find(',', prev_comma+1)
-
-    last_tag = string[prev_comma+1:].strip()
-    if last_tag:
-        tags.append(last_tag)
-    return tags
+    return [tag.strip() for tag in string.split(',') if tag.strip()]
 
 
 unsubscribe_list_item_template = Template('''
-- 
cgit v1.2.3


From f1cd3eb7519b10e55bb0a9780d34c1493efca176 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 9 Jun 2019 20:23:59 -0700
Subject: Support opml for subscriptions import

---
 youtube/subscriptions.py | 22 +++++++++++++++++++++-
 1 file changed, 21 insertions(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index be4ea1d..d43c8fd 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -9,6 +9,7 @@ import html
 import json
 import traceback
 import contextlib
+import defusedxml.ElementTree
 
 with open('yt_subscriptions_template.html', 'r', encoding='utf-8') as f:
     subscriptions_template = Template(f.read())
@@ -322,8 +323,27 @@ def import_subscriptions(env, start_response):
             traceback.print_exc()
             start_response('400 Bad Request', () )
             return b'400 Bad Request: Unknown json structure'
+    elif content_type in ('application/xml', 'text/xml', 'text/x-opml'):
+        try:
+            root = defusedxml.ElementTree.fromstring(file)
+            assert root.tag == 'opml'
+            channels = []
+            for outline_element in root[0][0]:
+                if (outline_element.tag != 'outline') or ('xmlUrl' not in outline_element.attrib):
+                    continue
+
+
+                channel_name = outline_element.attrib['text']
+                channel_rss_url = outline_element.attrib['xmlUrl']
+                channel_id = channel_rss_url[channel_rss_url.find('channel_id=')+11:].strip()
+                channels.append( (channel_id, channel_name) )
+
+        except (AssertionError, IndexError, defusedxml.ElementTree.ParseError) as e:
+            start_response('400 Bad Request', () )
+            return b'400 Bad Request: Unable to read opml xml file, or the file is not the expected format'
     else:
-        raise NotImplementedError()
+            start_response('400 Bad Request', () )
+            return b'400 Bad Request: Unsupported file format: ' + html.escape(content_type).encode('utf-8') + b'. Only subscription.json files (from Google Takeouts) and XML OPML files exported from Youtube\'s subscription manager page are supported'
 
     _subscribe(channels)
 
-- 
cgit v1.2.3


From d637f5b29c2153b0e4fde2f7183230100b2f6309 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 10 Jun 2019 02:29:55 -0700
Subject: Group by tags feature and improve appearance of sub list items

---
 youtube/subscriptions.py | 101 +++++++++++++++++++++++++++++++++++++++--------
 1 file changed, 85 insertions(+), 16 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index d43c8fd..7728c0c 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -151,6 +151,21 @@ def _get_channel_names(channel_ids):
             return result
 
 
+def _channels_with_tag(cursor, tag, order=False):
+    ''' returns list of (channel_id, channel_name) '''
+
+    statement = '''SELECT yt_channel_id, channel_name
+                   FROM subscribed_channels
+                   WHERE subscribed_channels.id IN (
+                       SELECT tag_associations.sql_channel_id FROM tag_associations WHERE tag=?
+                   )
+                '''
+    if order:
+        statement += '''ORDER BY channel_name'''
+
+    return cursor.execute(statement, [tag]).fetchall()
+
+
 units = {
     'year': 31536000,   # 365*24*3600
     'month': 2592000,   # 30*24*3600
@@ -281,11 +296,8 @@ def check_tags(tags):
     with open_database() as connection:
         with connection as cursor:
             for tag in tags:
-                channel_id_name_list += cursor.execute('''SELECT yt_channel_id, channel_name
-                                                          FROM subscribed_channels
-                                                          WHERE subscribed_channels.id IN (
-                                                              SELECT tag_associations.sql_channel_id FROM tag_associations WHERE tag=?
-                                                          )''', [tag]).fetchall()
+                channel_id_name_list += _channels_with_tag(cursor, tag)
+
     channel_names.update(channel_id_name_list)
     check_channels_if_necessary([item[0] for item in channel_id_name_list])
 
@@ -354,30 +366,87 @@ def import_subscriptions(env, start_response):
 
 sub_list_item_template = Template('''
 <li>
+    <input class="sub-list-checkbox" name="channel_ids" value="$channel_id" form="subscription-manager-form" type="checkbox">
     <a href="$channel_url" class="sub-list-item-name" title="$channel_name">$channel_name</a>
     <span class="tag-list">$tags</span>
-    <input class="sub-list-checkbox" name="channel_ids" value="$channel_id" form="subscription-manager-form" type="checkbox">
 </li>''')
 
+tag_group_template = Template('''
+<li class="tag-group">
+    <h2 class="tag-group-name">$tag</h2>
+    <ol class="sub-list">
+$sub_list
+    </ol>
+</li>
+''')
 def get_subscription_manager_page(env, start_response):
-
-    sub_list_html = ''
     with open_database() as connection:
         with connection as cursor:
-            for channel_name, channel_id in _get_subscribed_channels():
-                sub_list_html += sub_list_item_template.substitute(
-                    channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-                    channel_name = html.escape(channel_name),
-                    channel_id = channel_id,
-                    tags = ', '.join(_get_tags(cursor, channel_id)),
-                )
+            if env['parameters'].get('group_by_tags', '0')[0] == '1':
+
+                sort_name = "Don't group"
+                sort_link = util.URL_ORIGIN + '/subscription_manager'
+
+                main_list_html = '<ul class="tag-group-list">'
+                for tag in _get_all_tags():
+                    sub_list_html = ''
+                    for channel_id, channel_name in _channels_with_tag(cursor, tag, order=True):
+                        sub_list_html += sub_list_item_template.substitute(
+                            channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+                            channel_name = html.escape(channel_name),
+                            channel_id = channel_id,
+                            tags = ', '.join(t for t in _get_tags(cursor, channel_id) if t != tag),
+                        )
+                    main_list_html += tag_group_template.substitute(
+                        tag = tag,
+                        sub_list = sub_list_html,
+                    )
+
+                # Channels with no tags
+                channel_list = cursor.execute('''SELECT yt_channel_id, channel_name
+                                                 FROM subscribed_channels
+                                                 WHERE id NOT IN (
+                                                     SELECT sql_channel_id FROM tag_associations
+                                                 )
+                                                 ORDER BY channel_name''').fetchall()
+                if channel_list:
+                    sub_list_html = ''
+                    for channel_id, channel_name in channel_list:
+                        sub_list_html += sub_list_item_template.substitute(
+                            channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+                            channel_name = html.escape(channel_name),
+                            channel_id = channel_id,
+                            tags = '',
+                        )
+                    main_list_html += tag_group_template.substitute(
+                        tag = "No tags",
+                        sub_list = sub_list_html,
+                    )
+                main_list_html += '</ul>'
+
+            else:
+
+                sort_name = "Group by tags"
+                sort_link = util.URL_ORIGIN + '/subscription_manager?group_by_tags=1'
+
+                main_list_html = '<ol class="sub-list">'
+                for channel_name, channel_id in _get_subscribed_channels():
+                    main_list_html += sub_list_item_template.substitute(
+                        channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+                        channel_name = html.escape(channel_name),
+                        channel_id = channel_id,
+                        tags = ', '.join(_get_tags(cursor, channel_id)),
+                    )
+                main_list_html += '</ol>'
 
 
     start_response('200 OK', [('Content-type','text/html'),])
     return subscription_manager_template.substitute(
         header = html_common.get_header(),
-        sub_list = sub_list_html,
+        main_list = main_list_html,
+        sort_name = sort_name,
+        sort_link = sort_link,
         page_buttons = '',
     ).encode('utf-8')
 
-- 
cgit v1.2.3


From 9da073000a54fba8f6d38dc37bfcfd9ca0a60d9a Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 10 Jun 2019 15:27:17 -0700
Subject: Use a single cursor for db operations when possible instead of
 reopening multiple times

---
 youtube/subscriptions.py | 168 ++++++++++++++++++++++-------------------------
 1 file changed, 80 insertions(+), 88 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 7728c0c..5707286 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -63,66 +63,60 @@ def open_database():
     # https://stackoverflow.com/questions/19522505/using-sqlite3-in-python-with-with-keyword
     return contextlib.closing(connection)
 
-def _subscribe(channels):
+def with_open_db(function, *args, **kwargs):
+    with open_database() as connection:
+        with connection as cursor:
+            return function(cursor, *args, **kwargs)
+
+
+def _subscribe(cursor, channels):
     ''' channels is a list of (channel_id, channel_name) '''
 
     # set time_last_checked to 0 on all channels being subscribed to
     channels = ( (channel_id, channel_name, 0) for channel_id, channel_name in channels)
 
-    with open_database() as connection:
-        with connection as cursor:
-            cursor.executemany('''INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked)
-                                  VALUES (?, ?, ?)''', channels)
+    cursor.executemany('''INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked)
+                          VALUES (?, ?, ?)''', channels)
 
 # TODO: delete thumbnails
-def _unsubscribe(channel_ids):
+def _unsubscribe(cursor, channel_ids):
     ''' channel_ids is a list of channel_ids '''
-    with open_database() as connection:
-        with connection as cursor:
-            cursor.executemany("DELETE FROM subscribed_channels WHERE yt_channel_id=?", ((channel_id, ) for channel_id in channel_ids))
+    cursor.executemany("DELETE FROM subscribed_channels WHERE yt_channel_id=?", ((channel_id, ) for channel_id in channel_ids))
 
-def _get_videos(number, offset):
-    with open_database() as connection:
-        with connection as cursor:
-            db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
-                                          FROM videos
-                                          INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
-                                          ORDER BY time_published DESC
-                                          LIMIT ? OFFSET ?''', (number, offset))
-
-            for db_video in db_videos:
-                yield {
-                    'id':   db_video[0],
-                    'title':    db_video[1],
-                    'duration': db_video[2],
-                    'author':   db_video[3],
-                }
-
-def _get_subscribed_channels():
-    with open_database() as connection:
-        with connection as cursor:
-            for item in cursor.execute('''SELECT channel_name, yt_channel_id
-                                          FROM subscribed_channels
-                                          ORDER BY channel_name'''):
-                yield item
+def _get_videos(cursor, number, offset):
+    db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
+                                  FROM videos
+                                  INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
+                                  ORDER BY time_published DESC
+                                  LIMIT ? OFFSET ?''', (number, offset))
 
+    for db_video in db_videos:
+        yield {
+            'id':   db_video[0],
+            'title':    db_video[1],
+            'duration': db_video[2],
+            'author':   db_video[3],
+        }
 
-def _add_tags(channel_ids, tags):
-    with open_database() as connection:
-        with connection as cursor:
-            pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
-            cursor.executemany('''INSERT OR IGNORE INTO tag_associations (tag, sql_channel_id)
-                                  SELECT ?, id FROM subscribed_channels WHERE yt_channel_id = ? ''', pairs)
+def _get_subscribed_channels(cursor):
+    for item in cursor.execute('''SELECT channel_name, yt_channel_id
+                                  FROM subscribed_channels
+                                  ORDER BY channel_name'''):
+        yield item
 
 
-def _remove_tags(channel_ids, tags):
-    with open_database() as connection:
-        with connection as cursor:
-            pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
-            cursor.executemany('''DELETE FROM tag_associations
-                                  WHERE tag = ? AND sql_channel_id = (
-                                      SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
-                                   )''', pairs)
+def _add_tags(cursor, channel_ids, tags):
+    pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
+    cursor.executemany('''INSERT OR IGNORE INTO tag_associations (tag, sql_channel_id)
+                          SELECT ?, id FROM subscribed_channels WHERE yt_channel_id = ? ''', pairs)
+
+
+def _remove_tags(cursor, channel_ids, tags):
+    pairs = [(tag, yt_channel_id) for tag in tags for yt_channel_id in channel_ids]
+    cursor.executemany('''DELETE FROM tag_associations
+                          WHERE tag = ? AND sql_channel_id = (
+                              SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
+                           )''', pairs)
 
 
@@ -133,22 +127,18 @@ def _get_tags(cursor, channel_id):
                                                     SELECT id FROM subscribed_channels WHERE yt_channel_id = ?
                                                 )''', (channel_id,))]
 
-def _get_all_tags():
-    with open_database() as connection:
-        with connection as cursor:
-            return [row[0] for row in cursor.execute('''SELECT DISTINCT tag FROM tag_associations''')]
+def _get_all_tags(cursor):
+    return [row[0] for row in cursor.execute('''SELECT DISTINCT tag FROM tag_associations''')]
 
-def _get_channel_names(channel_ids):
+def _get_channel_names(cursor, channel_ids):
     ''' returns list of (channel_id, channel_name) '''
-    with open_database() as connection:
-        with connection as cursor:
-            result = []
-            for channel_id in channel_ids:
-                row = cursor.execute('''SELECT channel_name
-                                        FROM subscribed_channels
-                                        WHERE yt_channel_id = ?''', (channel_id,)).fetchone()
-                result.append( (channel_id, row[0]) )
-            return result
+    result = []
+    for channel_id in channel_ids:
+        row = cursor.execute('''SELECT channel_name
+                                FROM subscribed_channels
+                                WHERE yt_channel_id = ?''', (channel_id,)).fetchone()
+        result.append( (channel_id, row[0]) )
+    return result
 
 
 def _channels_with_tag(cursor, tag, order=False):
@@ -357,7 +347,7 @@ def import_subscriptions(env, start_response):
             start_response('400 Bad Request', () )
             return b'400 Bad Request: Unsupported file format: ' + html.escape(content_type).encode('utf-8') + b'. Only subscription.json files (from Google Takeouts) and XML OPML files exported from Youtube\'s subscription manager page are supported'
 
-    _subscribe(channels)
+    with_open_db(_subscribe, channels)
 
     start_response('303 See Other', [('Location', util.URL_ORIGIN + '/subscription_manager'),] )
     return b''
@@ -388,7 +378,7 @@ def get_subscription_manager_page(env, start_response):
                 sort_link = util.URL_ORIGIN + '/subscription_manager'
 
                 main_list_html = '<ul class="tag-group-list">'
-                for tag in _get_all_tags():
+                for tag in _get_all_tags(cursor):
                     sub_list_html = ''
                     for channel_id, channel_name in _channels_with_tag(cursor, tag, order=True):
                         sub_list_html += sub_list_item_template.substitute(
@@ -430,7 +420,7 @@ def get_subscription_manager_page(env, start_response):
                 sort_link = util.URL_ORIGIN + '/subscription_manager?group_by_tags=1'
 
                 main_list_html = '<ol class="sub-list">'
-                for channel_name, channel_id in _get_subscribed_channels():
+                for channel_name, channel_id in _get_subscribed_channels(cursor):
                     main_list_html += sub_list_item_template.substitute(
                         channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
                         channel_name = html.escape(channel_name),
@@ -461,11 +451,11 @@ def post_subscription_manager_page(env, start_response):
     action = params['action'][0]
 
     if action == 'add_tags':
-        _add_tags(params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
+        with_open_db(_add_tags, params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
     elif action == 'remove_tags':
-        _remove_tags(params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
+        with_open_db(_remove_tags, params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
     elif action == 'unsubscribe':
-        _unsubscribe(params['channel_ids'])
+        with_open_db(_unsubscribe, params['channel_ids'])
     elif action == 'unsubscribe_verify':
         page = '''
         <span>Are you sure you want to unsubscribe from these channels?</span>
@@ -479,7 +469,7 @@ def post_subscription_manager_page(env, start_response):
             <input type="submit" value="Yes, unsubscribe">
         </form>
         <ul>'''
-        for channel_id, channel_name in _get_channel_names(params['channel_ids']):
+        for channel_id, channel_name in with_open_db(_get_channel_names, params['channel_ids']):
             page += unsubscribe_list_item_template.substitute(
                 channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
                 channel_name = html.escape(channel_name),
@@ -526,29 +516,31 @@ sidebar_channel_item_template = Template('''
 </li>''')
 
 def get_subscriptions_page(env, start_response):
-    items_html = '''<nav class="item-grid">\n'''
+    with open_database() as connection:
+        with connection as cursor:
+            items_html = '''<nav class="item-grid">\n'''
 
-    for item in _get_videos(30, 0):
-        if item['id'] in downloading_thumbnails:
-            item['thumbnail'] = util.get_thumbnail_url(item['id'])
-        else:
-            item['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + item['id'] + '.jpg'
-        items_html += html_common.video_item_html(item, html_common.small_video_item_template)
-    items_html += '''\n</nav>'''
+            for item in _get_videos(cursor, 30, 0):
+                if item['id'] in downloading_thumbnails:
+                    item['thumbnail'] = util.get_thumbnail_url(item['id'])
+                else:
+                    item['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + item['id'] + '.jpg'
+                items_html += html_common.video_item_html(item, html_common.small_video_item_template)
+            items_html += '''\n</nav>'''
 
 
-    tag_list_html = ''
-    for tag_name in _get_all_tags():
-        tag_list_html += sidebar_tag_item_template.substitute(tag_name = tag_name)
+            tag_list_html = ''
+            for tag_name in _get_all_tags(cursor):
+                tag_list_html += sidebar_tag_item_template.substitute(tag_name = tag_name)
 
 
-    sub_list_html = ''
-    for channel_name, channel_id in _get_subscribed_channels():
-        sub_list_html += sidebar_channel_item_template.substitute(
-            channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-            channel_name = html.escape(channel_name),
-            channel_id = channel_id,
-        )
+            sub_list_html = ''
+            for channel_name, channel_id in _get_subscribed_channels(cursor):
+                sub_list_html += sidebar_channel_item_template.substitute(
+                    channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+                    channel_name = html.escape(channel_name),
+                    channel_id = channel_id,
+                )
 
 
@@ -568,10 +560,10 @@ def post_subscriptions_page(env, start_response):
         if len(params['channel_id']) != len(params['channel_name']):
             start_response('400 Bad Request', ())
             return b'400 Bad Request, length of channel_id != length of channel_name'
-        _subscribe(zip(params['channel_id'], params['channel_name']))
+        with_open_db(_subscribe, zip(params['channel_id'], params['channel_name']))
 
     elif action == 'unsubscribe':
-        _unsubscribe(params['channel_id'])
+        with_open_db(_unsubscribe, params['channel_id'])
 
     elif action == 'refresh':
         type = params['type'][0]
-- 
cgit v1.2.3


From 8539b48c7b858b826a660bd606149f8b84e72a84 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 10 Jun 2019 15:28:29 -0700
Subject: Retrieve 60 videos for subscriptions page instead of 30

---
 youtube/subscriptions.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 5707286..45a34b5 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -520,7 +520,7 @@ def get_subscriptions_page(env, start_response):
         with connection as cursor:
             items_html = '''<nav class="item-grid">\n'''
 
-            for item in _get_videos(cursor, 30, 0):
+            for item in _get_videos(cursor, 60, 0):
                 if item['id'] in downloading_thumbnails:
                     item['thumbnail'] = util.get_thumbnail_url(item['id'])
                 else:
-- 
cgit v1.2.3


From e7989db931132f71c54b8924e5194410cc7f9bbc Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 10 Jun 2019 15:36:53 -0700
Subject: Order channel names in a case-insensitive manner

---
 youtube/subscriptions.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 45a34b5..b6a4e0e 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -101,7 +101,7 @@ def _get_videos(cursor, number, offset):
 def _get_subscribed_channels(cursor):
     for item in cursor.execute('''SELECT channel_name, yt_channel_id
                                   FROM subscribed_channels
-                                  ORDER BY channel_name'''):
+                                  ORDER BY channel_name COLLATE NOCASE'''):
         yield item
 
 
@@ -151,7 +151,7 @@ def _channels_with_tag(cursor, tag, order=False):
                    )
                 '''
     if order:
-        statement += '''ORDER BY channel_name'''
+        statement += '''ORDER BY channel_name COLLATE NOCASE'''
 
     return cursor.execute(statement, [tag]).fetchall()
 
@@ -398,7 +398,7 @@ def get_subscription_manager_page(env, start_response):
                                                  WHERE id NOT IN (
                                                      SELECT sql_channel_id FROM tag_associations
                                                  )
-                                                 ORDER BY channel_name''').fetchall()
+                                                 ORDER BY channel_name COLLATE NOCASE''').fetchall()
                 if channel_list:
                     sub_list_html = ''
                     for channel_id, channel_name in channel_list:
-- 
cgit v1.2.3


From 103b37030fcd073b5f44b9ddc79da0ce15325a96 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 10 Jun 2019 17:04:06 -0700
Subject: Unsubscribe button on channels if already subscribed

---
 youtube/channel.py       | 44 +++++++++++++++++++++++++++++++++++++++++---
 youtube/subscriptions.py | 14 ++++++++++++++
 2 files changed, 55 insertions(+), 3 deletions(-)

(limited to 'youtube')

diff --git a/youtube/channel.py b/youtube/channel.py
index 55316e2..1b345b5 100644
--- a/youtube/channel.py
+++ b/youtube/channel.py
@@ -1,5 +1,5 @@
 import base64
-from youtube import util, yt_data_extract, html_common
+from youtube import util, yt_data_extract, html_common, subscriptions
 
 import http_errors
 import urllib
@@ -241,6 +241,12 @@ def channel_videos_html(polymer_json, current_page=1, current_sort=3, number_of_
     microformat = get_microformat(response)
     channel_url = microformat['urlCanonical'].rstrip('/')
     channel_id = channel_url[channel_url.rfind('/')+1:]
+    if subscriptions.is_subscribed(channel_id):
+        action_name = 'Unsubscribe'
+        action = 'unsubscribe'
+    else:
+        action_name = 'Subscribe'
+        action = 'subscribe'
 
     items = get_grid_items(response)
     items_html = grid_items_html(items, {'author': microformat['title']})
@@ -256,6 +262,8 @@ def channel_videos_html(polymer_json, current_page=1, current_sort=3, number_of_
         items               = items_html,
         page_buttons        = html_common.page_buttons_html(current_page, math.ceil(number_of_videos/30), util.URL_ORIGIN + "/channel/" + channel_id + "/videos", current_query_string),
         number_of_results   = '{:,}'.format(number_of_videos) + " videos",
+        action_name = action_name,
+        action = action,
     )
 
 def channel_playlists_html(polymer_json, current_sort=3):
@@ -264,6 +272,13 @@ def channel_playlists_html(polymer_json, current_sort=3):
     channel_url = microformat['urlCanonical'].rstrip('/')
     channel_id = channel_url[channel_url.rfind('/')+1:]
 
+    if subscriptions.is_subscribed(channel_id):
+        action_name = 'Unsubscribe'
+        action = 'unsubscribe'
+    else:
+        action_name = 'Subscribe'
+        action = 'subscribe'
+
     items = get_grid_items(response)
     items_html = grid_items_html(items, {'author': microformat['title']})
     
@@ -278,6 +293,8 @@ def channel_playlists_html(polymer_json, current_sort=3):
         items               = items_html,
         page_buttons        = '',
         number_of_results   = '',
+        action_name = action_name,
+        action = action,
     )
 
 # Example channel where tabs do not have definite index: https://www.youtube.com/channel/UC4gQ8i3FD7YbhOgqUkeQEJg
@@ -323,6 +340,16 @@ def channel_about_page(polymer_json):
             continue
         else:
             stats += stat_template.substitute(stat_value=stat_value)
+
+
+    channel_id = channel_metadata['channelId']
+    if subscriptions.is_subscribed(channel_id):
+        action_name = 'Unsubscribe'
+        action = 'unsubscribe'
+    else:
+        action_name = 'Subscribe'
+        action = 'subscribe'
+
     try:
         description = yt_data_extract.format_text_runs(yt_data_extract.get_formatted_text(channel_metadata['description']))
     except KeyError:
@@ -335,8 +362,10 @@ def channel_about_page(polymer_json):
         description         = description,
         links               = channel_links,
         stats               = stats,
-        channel_id          = channel_metadata['channelId'],
+        channel_id          = channel_id,
         channel_tabs        = channel_tabs_html(channel_metadata['channelId'], 'About'),
+        action_name = action_name,
+        action = action,
     )
 
 def channel_search_page(polymer_json, query, current_page=1, number_of_videos = 1000, current_query_string=''):
@@ -345,7 +374,14 @@ def channel_search_page(polymer_json, query, current_page=1, number_of_videos =
     channel_url = microformat['urlCanonical'].rstrip('/')
     channel_id = channel_url[channel_url.rfind('/')+1:]
 
-    
+    if subscriptions.is_subscribed(channel_id):
+        action_name = 'Unsubscribe'
+        action = 'unsubscribe'
+    else:
+        action_name = 'Subscribe'
+        action = 'subscribe'
+
+
     try:
         items = tab_with_content(response['contents']['twoColumnBrowseResultsRenderer']['tabs'])['sectionListRenderer']['contents']
     except KeyError:
@@ -364,6 +400,8 @@ def channel_search_page(polymer_json, query, current_page=1, number_of_videos =
         page_buttons        = html_common.page_buttons_html(current_page, math.ceil(number_of_videos/29), util.URL_ORIGIN + "/channel/" + channel_id + "/search", current_query_string),
         number_of_results   = '',
         sort_buttons        = '',
+        action_name = action_name,
+        action = action,
     )
 def get_channel_search_json(channel_id, query, page):
     params = proto.string(2, 'search') + proto.string(15, str(page))
diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index b6a4e0e..e12fa0b 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -68,6 +68,20 @@ def with_open_db(function, *args, **kwargs):
         with connection as cursor:
             return function(cursor, *args, **kwargs)
 
+def is_subscribed(channel_id):
+    if not os.path.exists(database_path):
+        return False
+
+    with open_database() as connection:
+        with connection as cursor:
+            result = cursor.execute('''SELECT EXISTS(
+                                           SELECT 1
+                                           FROM subscribed_channels
+                                           WHERE yt_channel_id=?
+                                           LIMIT 1
+                                       )''', [channel_id]).fetchone()
+            return bool(result[0])
+
 
 def _subscribe(cursor, channels):
     ''' channels is a list of (channel_id, channel_name) '''
-- 
cgit v1.2.3


From 59fdbda886c1bc1acc12da7061b0710b048ce252 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Tue, 11 Jun 2019 01:47:06 -0700
Subject: Add channel muting

---
 youtube/subscriptions.py | 126 ++++++++++++++++++++++++++++-------------------
 1 file changed, 76 insertions(+), 50 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index e12fa0b..5d049be 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -36,7 +36,9 @@ def open_database():
                               id integer PRIMARY KEY,
                               yt_channel_id text UNIQUE NOT NULL,
                               channel_name text NOT NULL,
-                              time_last_checked integer
+                              time_last_checked integer,
+                              muted integer DEFAULT 0,
+                              upload_frequency integer
                           )''')
         cursor.execute('''CREATE TABLE IF NOT EXISTS videos (
                               id integer PRIMARY KEY,
@@ -113,7 +115,7 @@ def _get_videos(cursor, number, offset):
         }
 
 def _get_subscribed_channels(cursor):
-    for item in cursor.execute('''SELECT channel_name, yt_channel_id
+    for item in cursor.execute('''SELECT channel_name, yt_channel_id, muted
                                   FROM subscribed_channels
                                   ORDER BY channel_name COLLATE NOCASE'''):
         yield item
@@ -155,15 +157,22 @@ def _get_channel_names(cursor, channel_ids):
     return result
 
 
-def _channels_with_tag(cursor, tag, order=False):
+def _channels_with_tag(cursor, tag, order=False, exclude_muted=False, include_muted_status=False):
     ''' returns list of (channel_id, channel_name) '''
 
-    statement = '''SELECT yt_channel_id, channel_name
+    statement = '''SELECT yt_channel_id, channel_name'''
+
+    if include_muted_status:
+        statement += ''', muted'''
+
+    statement += '''
                    FROM subscribed_channels
                    WHERE subscribed_channels.id IN (
                        SELECT tag_associations.sql_channel_id FROM tag_associations WHERE tag=?
                    )
                 '''
+    if exclude_muted:
+        statement += '''AND muted != 1\n'''
     if order:
         statement += '''ORDER BY channel_name COLLATE NOCASE'''
 
@@ -289,7 +298,9 @@ def _get_upstream_videos(channel_id):
 def check_all_channels():
     with open_database() as connection:
         with connection as cursor:
-            channel_id_name_list = cursor.execute('''SELECT yt_channel_id, channel_name FROM subscribed_channels''').fetchall()
+            channel_id_name_list = cursor.execute('''SELECT yt_channel_id, channel_name
+                                                     FROM subscribed_channels
+                                                     WHERE muted != 1''').fetchall()
 
     channel_names.update(channel_id_name_list)
     check_channels_if_necessary([item[0] for item in channel_id_name_list])
@@ -300,7 +311,7 @@ def check_tags(tags):
     with open_database() as connection:
         with connection as cursor:
             for tag in tags:
-                channel_id_name_list += _channels_with_tag(cursor, tag)
+                channel_id_name_list += _channels_with_tag(cursor, tag, exclude_muted=True)
 
     channel_names.update(channel_id_name_list)
     check_channels_if_necessary([item[0] for item in channel_id_name_list])
@@ -369,7 +380,7 @@ def import_subscriptions(env, start_response):
 
 
 sub_list_item_template = Template('''
-<li>
+<li class="sub-list-item $mute_class">
     <input class="sub-list-checkbox" name="channel_ids" value="$channel_id" form="subscription-manager-form" type="checkbox">
     <a href="$channel_url" class="sub-list-item-name" title="$channel_name">$channel_name</a>
     <span class="tag-list">$tags</span>
@@ -394,12 +405,13 @@ def get_subscription_manager_page(env, start_response):
                 main_list_html = '<ul class="tag-group-list">'
                 for tag in _get_all_tags(cursor):
                     sub_list_html = ''
-                    for channel_id, channel_name in _channels_with_tag(cursor, tag, order=True):
+                    for channel_id, channel_name, muted in _channels_with_tag(cursor, tag, order=True, include_muted_status=True):
                         sub_list_html += sub_list_item_template.substitute(
                             channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
                             channel_name = html.escape(channel_name),
                             channel_id = channel_id,
                             tags = ', '.join(t for t in _get_tags(cursor, channel_id) if t != tag),
+                            mute_class = 'muted' if muted else '',
                         )
                     main_list_html += tag_group_template.substitute(
                         tag = tag,
@@ -407,7 +419,7 @@ def get_subscription_manager_page(env, start_response):
                     )
 
                 # Channels with no tags
-                channel_list = cursor.execute('''SELECT yt_channel_id, channel_name
+                channel_list = cursor.execute('''SELECT yt_channel_id, channel_name, muted
                                                  FROM subscribed_channels
                                                  WHERE id NOT IN (
                                                      SELECT sql_channel_id FROM tag_associations
@@ -415,12 +427,13 @@ def get_subscription_manager_page(env, start_response):
                                                  ORDER BY channel_name COLLATE NOCASE''').fetchall()
                 if channel_list:
                     sub_list_html = ''
-                    for channel_id, channel_name in channel_list:
+                    for channel_id, channel_name, muted in channel_list:
                         sub_list_html += sub_list_item_template.substitute(
                             channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
                             channel_name = html.escape(channel_name),
                             channel_id = channel_id,
                             tags = '',
+                            mute_class = 'muted' if muted else '',
                         )
                     main_list_html += tag_group_template.substitute(
                         tag = "No tags",
@@ -434,12 +447,13 @@ def get_subscription_manager_page(env, start_response):
                 sort_link = util.URL_ORIGIN + '/subscription_manager?group_by_tags=1'
 
                 main_list_html = '<ol class="sub-list">'
-                for channel_name, channel_id in _get_subscribed_channels(cursor):
+                for channel_name, channel_id, muted in _get_subscribed_channels(cursor):
                     main_list_html += sub_list_item_template.substitute(
                         channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
                         channel_name = html.escape(channel_name),
                         channel_id = channel_id,
                         tags = ', '.join(_get_tags(cursor, channel_id)),
+                        mute_class = 'muted' if muted else '',
                     )
                 main_list_html += '</ol>'
 
@@ -464,42 +478,53 @@ def post_subscription_manager_page(env, start_response):
     params = env['parameters']
     action = params['action'][0]
 
-    if action == 'add_tags':
-        with_open_db(_add_tags, params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
-    elif action == 'remove_tags':
-        with_open_db(_remove_tags, params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
-    elif action == 'unsubscribe':
-        with_open_db(_unsubscribe, params['channel_ids'])
-    elif action == 'unsubscribe_verify':
-        page = '''
-        <span>Are you sure you want to unsubscribe from these channels?</span>
-        <form class="subscriptions-import-form" action="/youtube.com/subscription_manager" method="POST">'''
-
-        for channel_id in params['channel_ids']:
-            page += '<input type="hidden" name="channel_ids" value="' + channel_id + '">\n'
-
-        page += '''
-            <input type="hidden" name="action" value="unsubscribe">
-            <input type="submit" value="Yes, unsubscribe">
-        </form>
-        <ul>'''
-        for channel_id, channel_name in with_open_db(_get_channel_names, params['channel_ids']):
-            page += unsubscribe_list_item_template.substitute(
-                channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-                channel_name = html.escape(channel_name),
-            )
-        page += '''</ul>'''
-
-        start_response('200 OK', [('Content-type','text/html'),])
-        return html_common.yt_basic_template.substitute(
-            page_title = 'Unsubscribe?',
-            style = '',
-            header = html_common.get_header(),
-            page = page,
-        ).encode('utf-8')
-    else:
-        start_response('400 Bad Request', ())
-        return b'400 Bad Request'
+    with open_database() as connection:
+        with connection as cursor:
+            if action == 'add_tags':
+                _add_tags(cursor, params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
+            elif action == 'remove_tags':
+                _remove_tags(cursor, params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
+            elif action == 'unsubscribe':
+                _unsubscribe(cursor, params['channel_ids'])
+            elif action == 'unsubscribe_verify':
+                page = '''
+                <span>Are you sure you want to unsubscribe from these channels?</span>
+                <form class="subscriptions-import-form" action="/youtube.com/subscription_manager" method="POST">'''
+
+                for channel_id in params['channel_ids']:
+                    page += '<input type="hidden" name="channel_ids" value="' + channel_id + '">\n'
+
+                page += '''
+                    <input type="hidden" name="action" value="unsubscribe">
+                    <input type="submit" value="Yes, unsubscribe">
+                </form>
+                <ul>'''
+                for channel_id, channel_name in _get_channel_names(cursor, params['channel_ids']):
+                    page += unsubscribe_list_item_template.substitute(
+                        channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
+                        channel_name = html.escape(channel_name),
+                    )
+                page += '''</ul>'''
+
+                start_response('200 OK', [('Content-type','text/html'),])
+                return html_common.yt_basic_template.substitute(
+                    page_title = 'Unsubscribe?',
+                    style = '',
+                    header = html_common.get_header(),
+                    page = page,
+                ).encode('utf-8')
+            elif action == 'mute':
+                cursor.executemany('''UPDATE subscribed_channels
+                                      SET muted = 1
+                                      WHERE yt_channel_id = ?''', [(ci,) for ci in params['channel_ids']])
+            elif action == 'unmute':
+                cursor.executemany('''UPDATE subscribed_channels
+                                      SET muted = 0
+                                      WHERE yt_channel_id = ?''', [(ci,) for ci in params['channel_ids']])
+
+            else:
+                start_response('400 Bad Request', ())
+                return b'400 Bad Request'
 
     start_response('303 See Other', [('Location', util.URL_ORIGIN + '/subscription_manager'),] )
     return b''
@@ -507,7 +532,7 @@ def post_subscription_manager_page(env, start_response):
 
 
 sidebar_tag_item_template = Template('''
-<li>
+<li class="sidebar-list-item">
     <span class="sidebar-item-name">$tag_name</span>
     <form method="POST" class="sidebar-item-refresh">
         <input type="submit" value="Check">
@@ -519,7 +544,7 @@ sidebar_tag_item_template = Template('''
 
 
 sidebar_channel_item_template = Template('''
-<li>
+<li class="sidebar-list-item $mute_class">
     <a href="$channel_url" class="sidebar-item-name" title="$channel_name">$channel_name</a>
     <form method="POST" class="sidebar-item-refresh">
         <input type="submit" value="Check">
@@ -549,11 +574,12 @@ def get_subscriptions_page(env, start_response):
 
 
             sub_list_html = ''
-            for channel_name, channel_id in _get_subscribed_channels(cursor):
+            for channel_name, channel_id, muted in _get_subscribed_channels(cursor):
                 sub_list_html += sidebar_channel_item_template.substitute(
                     channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
                     channel_name = html.escape(channel_name),
                     channel_id = channel_id,
+                    mute_class = 'muted' if muted else '',
                 )
 
 
-- 
cgit v1.2.3


From cc9283ad5332f59a69a91d9d0fab299779de513c Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Tue, 11 Jun 2019 01:50:01 -0700
Subject: Fix checking specific channels

---
 youtube/subscriptions.py | 1 +
 1 file changed, 1 insertion(+)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 5d049be..fdba114 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -320,6 +320,7 @@ def check_tags(tags):
 def check_specific_channels(channel_ids):
     with open_database() as connection:
         with connection as cursor:
+            channel_id_name_list = []
             for channel_id in channel_ids:
                 channel_id_name_list += cursor.execute('''SELECT yt_channel_id, channel_name
                                                           FROM subscribed_channels
-- 
cgit v1.2.3


From 163814d35cbcad575d0deec54b31b94e2bbaaebb Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 10 Aug 2019 00:09:03 -0700
Subject: Convert subscriptions page to flask framework

---
 youtube/subscriptions.py             | 160 ++++++++++++++---------------------
 youtube/templates/subscriptions.html |  97 +++++++++++++++++++++
 2 files changed, 161 insertions(+), 96 deletions(-)
 create mode 100644 youtube/templates/subscriptions.html

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index fdba114..a238ae4 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -1,21 +1,18 @@
-from youtube import util, yt_data_extract, html_common, channel
+from youtube import util, yt_data_extract, channel
+from youtube import yt_app
 import settings
-from string import Template
+
 import sqlite3
 import os
 import time
 import gevent
-import html
 import json
 import traceback
 import contextlib
 import defusedxml.ElementTree
 
-with open('yt_subscriptions_template.html', 'r', encoding='utf-8') as f:
-    subscriptions_template = Template(f.read())
-
-with open('yt_subscription_manager_template.html', 'r', encoding='utf-8') as f:
-    subscription_manager_template = Template(f.read())
+import flask
+from flask import request
 
 
 thumbnails_directory = os.path.join(settings.data_dir, "subscription_thumbnails")
@@ -272,16 +269,15 @@ def _get_upstream_videos(channel_id):
 
     videos = []
 
-    json_channel_videos = channel.get_grid_items(channel.get_channel_tab(channel_id)[1]['response'])
-    for i, json_video in enumerate(json_channel_videos):
-        info = yt_data_extract.renderer_info(json_video['gridVideoRenderer'])
-        if 'description' not in info:
-            info['description'] = ''
+    channel_videos = channel.extract_info(json.loads(channel.get_channel_tab(channel_id)), 'videos')['items']
+    for i, video_item in enumerate(channel_videos):
+        if 'description' not in video_item:
+            video_item['description'] = ''
         try:
-            info['time_published'] = youtube_timestamp_to_posix(info['published']) - i  # subtract a few seconds off the videos so they will be in the right order
+            video_item['time_published'] = youtube_timestamp_to_posix(video_item['published']) - i  # subtract a few seconds off the videos so they will be in the right order
         except KeyError:
-            print(info)
-        videos.append((channel_id, info['id'], info['title'], info['duration'], info['time_published'], info['description']))
+            print(video_item)
+        videos.append((channel_id, video_item['id'], video_item['title'], video_item['duration'], video_item['time_published'], video_item['description']))
 
     now = time.time()
     download_thumbnails_if_necessary(video[1] for video in videos if (now - video[4]) < 30*24*3600) # Don't download thumbnails from videos older than a month
@@ -380,7 +376,7 @@ def import_subscriptions(env, start_response):
 
 
-sub_list_item_template = Template('''
+"""sub_list_item_template = Template('''
 <li class="sub-list-item $mute_class">
     <input class="sub-list-checkbox" name="channel_ids" value="$channel_id" form="subscription-manager-form" type="checkbox">
     <a href="$channel_url" class="sub-list-item-name" title="$channel_name">$channel_name</a>
@@ -394,7 +390,7 @@ tag_group_template = Template('''
 $sub_list
     </ol>
 </li>
-''')
+''')"""
 def get_subscription_manager_page(env, start_response):
     with open_database() as connection:
         with connection as cursor:
@@ -473,8 +469,8 @@ def list_from_comma_separated_tags(string):
     return [tag.strip() for tag in string.split(',') if tag.strip()]
 
 
-unsubscribe_list_item_template = Template('''
-<li><a href="$channel_url" title="$channel_name">$channel_name</a></li>''')
+"""unsubscribe_list_item_template = Template('''
+<li><a href="$channel_url" title="$channel_name">$channel_name</a></li>''')"""
 def post_subscription_manager_page(env, start_response):
     params = env['parameters']
     action = params['action'][0]
@@ -531,97 +527,69 @@ def post_subscription_manager_page(env, start_response):
     return b''
 
 
-
-sidebar_tag_item_template = Template('''
-<li class="sidebar-list-item">
-    <span class="sidebar-item-name">$tag_name</span>
-    <form method="POST" class="sidebar-item-refresh">
-        <input type="submit" value="Check">
-        <input type="hidden" name="action" value="refresh">
-        <input type="hidden" name="type" value="tag">
-        <input type="hidden" name="tag_name" value="$tag_name">
-    </form>
-</li>''')
-
-
-sidebar_channel_item_template = Template('''
-<li class="sidebar-list-item $mute_class">
-    <a href="$channel_url" class="sidebar-item-name" title="$channel_name">$channel_name</a>
-    <form method="POST" class="sidebar-item-refresh">
-        <input type="submit" value="Check">
-        <input type="hidden" name="action" value="refresh">
-        <input type="hidden" name="type" value="channel">
-        <input type="hidden" name="channel_id" value="$channel_id">
-    </form>
-</li>''')
-
-def get_subscriptions_page(env, start_response):
+@yt_app.route('/subscriptions', methods=['GET'])
+@yt_app.route('/feed/subscriptions', methods=['GET'])
+def get_subscriptions_page():  # Renders subscriptions.html from the videos, tags and subscribed channels read from the database
     with open_database() as connection:
         with connection as cursor:
-            items_html = '''<nav class="item-grid">\n'''
-
-            for item in _get_videos(cursor, 60, 0):
-                if item['id'] in downloading_thumbnails:
-                    item['thumbnail'] = util.get_thumbnail_url(item['id'])
+            videos = []
+            for video in _get_videos(cursor, 60, 0):  # NOTE(review): 60, 0 are presumably limit and offset -- confirm against _get_videos
+                if video['id'] in downloading_thumbnails:  # listed in downloading_thumbnails: use util.get_thumbnail_url instead of the local file URL
+                    video['thumbnail'] = util.get_thumbnail_url(video['id'])
                 else:
-                    item['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + item['id'] + '.jpg'
-                items_html += html_common.video_item_html(item, html_common.small_video_item_template)
-            items_html += '''\n</nav>'''
-
+                    video['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + video['id'] + '.jpg'
+                video['type'] = 'video'  # extra keys, presumably read by the template's item macro -- confirm in common_elements.html
+                video['item_size'] = 'small'
+                videos.append(video)
 
-            tag_list_html = ''
-            for tag_name in _get_all_tags(cursor):
-                tag_list_html += sidebar_tag_item_template.substitute(tag_name = tag_name)
+            tags = _get_all_tags(cursor)
 
 
-            sub_list_html = ''
+            subscription_list = []  # one dict per subscribed channel, passed to the template as subscription_list
             for channel_name, channel_id, muted in _get_subscribed_channels(cursor):
-                sub_list_html += sidebar_channel_item_template.substitute(
-                    channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-                    channel_name = html.escape(channel_name),
-                    channel_id = channel_id,
-                    mute_class = 'muted' if muted else '',
-                )
-
-
-
-    start_response('200 OK', [('Content-type','text/html'),])
-    return subscriptions_template.substitute(
-        header = html_common.get_header(),
-        items = items_html,
-        tags = tag_list_html,
-        sub_list = sub_list_html,
-        page_buttons = '',
-    ).encode('utf-8')
-
-def post_subscriptions_page(env, start_response):
-    params = env['parameters']
-    action = params['action'][0]
+                subscription_list.append({
+                    'channel_url': util.URL_ORIGIN + '/channel/' + channel_id,
+                    'channel_name': channel_name,
+                    'channel_id': channel_id,
+                    'muted': muted,
+                })
+
+    return flask.render_template('subscriptions.html',
+        videos = videos,
+        tags = tags,
+        subscription_list = subscription_list,
+    )
+
+@yt_app.route('/subscriptions', methods=['POST'])
+@yt_app.route('/feed/subscriptions', methods=['POST'])
+def post_subscriptions_page():  # Handles the 'subscribe', 'unsubscribe' and 'refresh' form actions; replies 204 on success, 400 otherwise
+    action = request.values['action']
     if action == 'subscribe':
-        if len(params['channel_id']) != len(params['channel_name']):
-            start_response('400 Bad Request', ())
-            return b'400 Bad Request, length of channel_id != length of channel_name'
-        with_open_db(_subscribe, zip(params['channel_id'], params['channel_name']))
+        if len(request.values.getlist('channel_id')) != len(request.values.getlist('channel_name')):  # request.values is a MultiDict, not a callable
+            return '400 Bad Request, length of channel_id != length of channel_name', 400
+        with_open_db(_subscribe, zip(request.values.getlist('channel_id'), request.values.getlist('channel_name')))
 
     elif action == 'unsubscribe':
-        with_open_db(_unsubscribe, params['channel_id'])
+        with_open_db(_unsubscribe, request.values.getlist('channel_id'))
 
     elif action == 'refresh':
-        type = params['type'][0]
+        type = request.values['type']
         if type == 'all':
             check_all_channels()
         elif type == 'tag':
-            check_tags(params['tag_name'])
+            check_tags(request.values.getlist('tag_name'))
         elif type == 'channel':
-            check_specific_channels(params['channel_id'])
+            check_specific_channels(request.values.getlist('channel_id'))
         else:
-            start_response('400 Bad Request', ())
-            return b'400 Bad Request'
-
-        start_response('204 No Content', ())
-        return b''
+            flask.abort(400)
     else:
-        start_response('400 Bad Request', ())
-        return b'400 Bad Request'
-    start_response('204 No Content', ())
-    return b''
+        flask.abort(400)
+
+    return '', 204
+
+
+@yt_app.route('/data/subscription_thumbnails/<thumbnail>')
+def serve_subscription_thumbnail(thumbnail):  # Serves the file named by the URL's <thumbnail> part from thumbnails_directory
+    # The '..' prefix is needed because flask resolves a relative directory against the application directory (./youtube), not the working directory
+    return flask.send_from_directory(os.path.join('..', thumbnails_directory), thumbnail)
+
diff --git a/youtube/templates/subscriptions.html b/youtube/templates/subscriptions.html
new file mode 100644
index 0000000..a3227b1
--- /dev/null
+++ b/youtube/templates/subscriptions.html
@@ -0,0 +1,97 @@
+{% set page_title = 'Subscriptions' %}
+{% extends "base.html" %}
+{% import "common_elements.html" as common_elements %}
+
+{% block style %}
+    main{
+        display:flex;
+        flex-direction: row;
+    }
+    .item-grid{
+        flex-grow: 1;
+    }
+    .subscriptions-sidebar{
+        flex-basis: 300px;
+        background-color: #dadada;
+        border-left: 2px;
+    }
+        .sidebar-links{
+            display:flex;
+            justify-content: space-between;
+            padding-left:10px;
+            padding-right: 10px;
+        }
+
+        .sidebar-list{
+            list-style: none;
+            padding-left:10px;
+            padding-right: 10px;
+        }
+            .sidebar-list-item{
+                display:flex;
+                justify-content: space-between;
+                margin-bottom: 5px;
+            }
+                .sub-refresh-list .sidebar-item-name{
+                    text-overflow: clip;
+                    white-space: nowrap;
+                    overflow: hidden;
+                    max-width: 200px;
+                }
+            .muted{
+                background-color: #888888;
+            }
+{% endblock style %}
+
+{% block main %}
+    <nav class="item-grid">
+        {% for video_info in videos %}
+            {{ common_elements.item(video_info, include_author=false) }}
+        {% endfor %}
+    </nav>
+
+    <div class="subscriptions-sidebar">
+        <div class="sidebar-links">
+            <a href="/youtube.com/subscription_manager" class="sub-manager-link">Subscription Manager</a>
+            <form method="POST" class="refresh-all">
+                <input type="submit" value="Check All">
+                <input type="hidden" name="action" value="refresh">
+                <input type="hidden" name="type" value="all">
+            </form>
+        </div>
+
+        <hr>
+        <ol class="sidebar-list tags">
+            {% for tag in tags %}
+                <li class="sidebar-list-item">
+                    <span class="sidebar-item-name">{{ tag }}</span>
+                    <form method="POST" class="sidebar-item-refresh">
+                        <input type="submit" value="Check">
+                        <input type="hidden" name="action" value="refresh">
+                        <input type="hidden" name="type" value="tag">
+                        <input type="hidden" name="tag_name" value="{{ tag }}">
+                    </form>
+                </li>
+            {% endfor %}
+        </ol>
+
+        <ol class="sidebar-list sub-refresh-list">
+            {% for subscription in subscription_list %}
+                <li class="sidebar-list-item {{ 'muted' if subscription['muted'] else '' }}">
+                    <a href="{{ subscription['channel_url'] }}" class="sidebar-item-name" title="{{ subscription['channel_name'] }}">{{ subscription['channel_name'] }}</a>
+                    <form method="POST" class="sidebar-item-refresh">
+                        <input type="submit" value="Check">
+                        <input type="hidden" name="action" value="refresh">
+                        <input type="hidden" name="type" value="channel">
+                        <input type="hidden" name="channel_id" value="{{ subscription['channel_id'] }}">
+                    </form>
+                </li>
+            {% endfor %}
+        </ol>
+
+    </div>
+
+    <nav class="page-button-row">
+        {# TODO #}
+    </nav>
+{% endblock main %}
-- 
cgit v1.2.3


From 33bba9762c7f96a754351f3422f74364c5bdecac Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 10 Aug 2019 17:05:14 -0700
Subject: Convert subscription manager to flask framework

---
 youtube/subscriptions.py                    | 210 +++++++++++-----------------
 youtube/templates/subscription_manager.html | 141 +++++++++++++++++++
 youtube/templates/unsubscribe_verify.html   |  19 +++
 3 files changed, 242 insertions(+), 128 deletions(-)
 create mode 100644 youtube/templates/subscription_manager.html
 create mode 100644 youtube/templates/unsubscribe_verify.html

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index a238ae4..fa0570c 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -326,28 +326,38 @@ def check_specific_channels(channel_ids):
 
 
+@yt_app.route('/import_subscriptions', methods=['POST'])
+def import_subscriptions():
 
-def import_subscriptions(env, start_response):
-    content_type = env['parameters']['subscriptions_file'][0]
-    file = env['parameters']['subscriptions_file'][1]
+    # check if the post request has the file part
+    if 'subscriptions_file' not in request.files:
+        # Redirecting to request.full_path would make the browser issue a GET, which this POST-only route rejects
+        return '400 Bad Request: No subscriptions file was provided', 400
+    file = request.files['subscriptions_file']
+    # if the user does not select a file, the browser still
+    # submits an empty part without a filename
+    if file.filename == '':
+        # Answer directly for the same reason: a redirect back to this POST-only route cannot succeed
+        return '400 Bad Request: No file selected', 400
 
-    file = file.decode('utf-8')
 
-    if content_type == 'application/json':
+    mime_type = file.mimetype
+
+    if mime_type == 'application/json':
+        file = file.read().decode('utf-8')
         try:
             file = json.loads(file)
         except json.decoder.JSONDecodeError:
             traceback.print_exc()
-            start_response('400 Bad Request', () )
-            return b'400 Bad Request: Invalid json file'
+            return '400 Bad Request: Invalid json file', 400
 
         try:
             channels = ( (item['snippet']['resourceId']['channelId'], item['snippet']['title']) for item in file)
         except (KeyError, IndexError):
             traceback.print_exc()
-            start_response('400 Bad Request', () )
-            return b'400 Bad Request: Unknown json structure'
-    elif content_type in ('application/xml', 'text/xml', 'text/x-opml'):
+            return '400 Bad Request: Unknown json structure', 400
+    elif mime_type in ('application/xml', 'text/xml', 'text/x-opml'):
+        file = file.read().decode('utf-8')
         try:
             root = defusedxml.ElementTree.fromstring(file)
             assert root.tag == 'opml'
@@ -363,57 +373,36 @@ def import_subscriptions(env, start_response):
                 channels.append( (channel_id, channel_name) )
 
         except (AssertionError, IndexError, defusedxml.ElementTree.ParseError) as e:
-            start_response('400 Bad Request', () )
-            return b'400 Bad Request: Unable to read opml xml file, or the file is not the expected format'
+            return '400 Bad Request: Unable to read opml xml file, or the file is not the expected format', 400
     else:
-            start_response('400 Bad Request', () )
-            return b'400 Bad Request: Unsupported file format: ' + html.escape(content_type).encode('utf-8') + b'. Only subscription.json files (from Google Takeouts) and XML OPML files exported from Youtube\'s subscription manager page are supported'
+            return '400 Bad Request: Unsupported file format: ' + mime_type + '. Only subscription.json files (from Google Takeouts) and XML OPML files exported from Youtube\'s subscription manager page are supported', 400
 
     with_open_db(_subscribe, channels)
 
-    start_response('303 See Other', [('Location', util.URL_ORIGIN + '/subscription_manager'),] )
-    return b''
-
+    return flask.redirect(util.URL_ORIGIN + '/subscription_manager', 303)
 
 
-"""sub_list_item_template = Template('''
-<li class="sub-list-item $mute_class">
-    <input class="sub-list-checkbox" name="channel_ids" value="$channel_id" form="subscription-manager-form" type="checkbox">
-    <a href="$channel_url" class="sub-list-item-name" title="$channel_name">$channel_name</a>
-    <span class="tag-list">$tags</span>
-</li>''')
 
-tag_group_template = Template('''
-<li class="tag-group">
-    <h2 class="tag-group-name">$tag</h2>
-    <ol class="sub-list">
-$sub_list
-    </ol>
-</li>
-''')"""
-def get_subscription_manager_page(env, start_response):
+@yt_app.route('/subscription_manager', methods=['GET'])
+def get_subscription_manager_page():
+    group_by_tags = request.args.get('group_by_tags', '0') == '1'
     with open_database() as connection:
         with connection as cursor:
-            if env['parameters'].get('group_by_tags', '0')[0] == '1':
+            if group_by_tags:
+                tag_groups = []
 
-                sort_name = "Don't group"
-                sort_link = util.URL_ORIGIN + '/subscription_manager'
-
-                main_list_html = '<ul class="tag-group-list">'
                 for tag in _get_all_tags(cursor):
-                    sub_list_html = ''
+                    sub_list = []
                     for channel_id, channel_name, muted in _channels_with_tag(cursor, tag, order=True, include_muted_status=True):
-                        sub_list_html += sub_list_item_template.substitute(
-                            channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-                            channel_name = html.escape(channel_name),
-                            channel_id = channel_id,
-                            tags = ', '.join(t for t in _get_tags(cursor, channel_id) if t != tag),
-                            mute_class = 'muted' if muted else '',
-                        )
-                    main_list_html += tag_group_template.substitute(
-                        tag = tag,
-                        sub_list = sub_list_html,
-                    )
+                        sub_list.append({
+                            'channel_url': util.URL_ORIGIN + '/channel/' + channel_id,
+                            'channel_name': channel_name,
+                            'channel_id': channel_id,
+                            'muted': muted,
+                            'tags': [t for t in _get_tags(cursor, channel_id) if t != tag],
+                        })
+
+                    tag_groups.append( (tag, sub_list) )
 
                 # Channels with no tags
                 channel_list = cursor.execute('''SELECT yt_channel_id, channel_name, muted
@@ -423,109 +412,74 @@ def get_subscription_manager_page(env, start_response):
                                                  )
                                                  ORDER BY channel_name COLLATE NOCASE''').fetchall()
                 if channel_list:
-                    sub_list_html = ''
+                    sub_list = []
                     for channel_id, channel_name, muted in channel_list:
-                        sub_list_html += sub_list_item_template.substitute(
-                            channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-                            channel_name = html.escape(channel_name),
-                            channel_id = channel_id,
-                            tags = '',
-                            mute_class = 'muted' if muted else '',
-                        )
-                    main_list_html += tag_group_template.substitute(
-                        tag = "No tags",
-                        sub_list = sub_list_html,
-                    )
-                main_list_html += '</ul>'
-
+                        sub_list.append({
+                            'channel_url': util.URL_ORIGIN + '/channel/' + channel_id,
+                            'channel_name': channel_name,
+                            'channel_id': channel_id,
+                            'muted': muted,
+                            'tags': [],
+                        })
+
+                    tag_groups.append( ('No tags', sub_list) )
             else:
+                sub_list = []
+                for channel_name, channel_id, muted in _get_subscribed_channels(cursor):
+                    sub_list.append({
+                        'channel_url': util.URL_ORIGIN + '/channel/' + channel_id,
+                        'channel_name': channel_name,
+                        'channel_id': channel_id,
+                        'muted': muted,
+                        'tags': _get_tags(cursor, channel_id),
+                    })
 
-                sort_name = "Group by tags"
-                sort_link = util.URL_ORIGIN + '/subscription_manager?group_by_tags=1'
 
-                main_list_html = '<ol class="sub-list">'
-                for channel_name, channel_id, muted in _get_subscribed_channels(cursor):
-                    main_list_html += sub_list_item_template.substitute(
-                        channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-                        channel_name = html.escape(channel_name),
-                        channel_id = channel_id,
-                        tags = ', '.join(_get_tags(cursor, channel_id)),
-                        mute_class = 'muted' if muted else '',
-                    )
-                main_list_html += '</ol>'
-
-
-
-    start_response('200 OK', [('Content-type','text/html'),])
-    return subscription_manager_template.substitute(
-        header = html_common.get_header(),
-        main_list = main_list_html,
-        sort_name = sort_name,
-        sort_link = sort_link,
-        page_buttons = '',
-    ).encode('utf-8')
+
+
+    if group_by_tags:
+        return flask.render_template('subscription_manager.html',
+            group_by_tags = True,
+            tag_groups = tag_groups,
+        )
+    else:
+        return flask.render_template('subscription_manager.html',
+            group_by_tags = False,
+            sub_list = sub_list,
+        )
 
 def list_from_comma_separated_tags(string):
     return [tag.strip() for tag in string.split(',') if tag.strip()]
 
 
-"""unsubscribe_list_item_template = Template('''
-<li><a href="$channel_url" title="$channel_name">$channel_name</a></li>''')"""
-def post_subscription_manager_page(env, start_response):
-    params = env['parameters']
-    action = params['action'][0]
+@yt_app.route('/subscription_manager', methods=['POST'])
+def post_subscription_manager_page():
+    action = request.values['action']
 
     with open_database() as connection:
         with connection as cursor:
             if action == 'add_tags':
-                _add_tags(cursor, params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
+                _add_tags(cursor, request.values.getlist('channel_ids'), [tag.lower() for tag in list_from_comma_separated_tags(request.values['tags'])])
             elif action == 'remove_tags':
-                _remove_tags(cursor, params['channel_ids'], [tag.lower() for tag in list_from_comma_separated_tags(params['tags'][0])])
+                _remove_tags(cursor, request.values.getlist('channel_ids'), [tag.lower() for tag in list_from_comma_separated_tags(request.values['tags'])])
             elif action == 'unsubscribe':
-                _unsubscribe(cursor, params['channel_ids'])
+                _unsubscribe(cursor, request.values.getlist('channel_ids'))
             elif action == 'unsubscribe_verify':
-                page = '''
-                <span>Are you sure you want to unsubscribe from these channels?</span>
-                <form class="subscriptions-import-form" action="/youtube.com/subscription_manager" method="POST">'''
-
-                for channel_id in params['channel_ids']:
-                    page += '<input type="hidden" name="channel_ids" value="' + channel_id + '">\n'
-
-                page += '''
-                    <input type="hidden" name="action" value="unsubscribe">
-                    <input type="submit" value="Yes, unsubscribe">
-                </form>
-                <ul>'''
-                for channel_id, channel_name in _get_channel_names(cursor, params['channel_ids']):
-                    page += unsubscribe_list_item_template.substitute(
-                        channel_url = util.URL_ORIGIN + '/channel/' + channel_id,
-                        channel_name = html.escape(channel_name),
-                    )
-                page += '''</ul>'''
-
-                start_response('200 OK', [('Content-type','text/html'),])
-                return html_common.yt_basic_template.substitute(
-                    page_title = 'Unsubscribe?',
-                    style = '',
-                    header = html_common.get_header(),
-                    page = page,
-                ).encode('utf-8')
+                unsubscribe_list = _get_channel_names(cursor, request.values.getlist('channel_ids'))
+                return flask.render_template('unsubscribe_verify.html', unsubscribe_list = unsubscribe_list)
+
             elif action == 'mute':
                 cursor.executemany('''UPDATE subscribed_channels
                                       SET muted = 1
-                                      WHERE yt_channel_id = ?''', [(ci,) for ci in params['channel_ids']])
+                                      WHERE yt_channel_id = ?''', [(ci,) for ci in request.values.getlist('channel_ids')])
             elif action == 'unmute':
                 cursor.executemany('''UPDATE subscribed_channels
                                       SET muted = 0
-                                      WHERE yt_channel_id = ?''', [(ci,) for ci in params['channel_ids']])
-
+                                      WHERE yt_channel_id = ?''', [(ci,) for ci in request.values.getlist('channel_ids')])
             else:
-                start_response('400 Bad Request', ())
-                return b'400 Bad Request'
-
-    start_response('303 See Other', [('Location', util.URL_ORIGIN + '/subscription_manager'),] )
-    return b''
+                flask.abort(400)
 
+    return flask.redirect(util.URL_ORIGIN + request.full_path, 303)
 
 @yt_app.route('/subscriptions', methods=['GET'])
 @yt_app.route('/feed/subscriptions', methods=['GET'])
diff --git a/youtube/templates/subscription_manager.html b/youtube/templates/subscription_manager.html
new file mode 100644
index 0000000..838f4af
--- /dev/null
+++ b/youtube/templates/subscription_manager.html
@@ -0,0 +1,141 @@
+{% set page_title = 'Subscription Manager' %}
+{% extends "base.html" %}
+{% block style %}
+    .import-export{
+        display: flex;
+        flex-direction: row;
+    }
+        .subscriptions-import-form{
+            background-color: #dadada;
+            display: flex;
+            flex-direction: column;
+            align-items: flex-start;
+            max-width: 300px;
+            padding:10px;
+        }
+            .subscriptions-import-form h2{
+                font-size: 20px;
+                margin-bottom: 10px;
+            }
+
+            .import-submit-button{
+                margin-top:15px;
+                align-self: flex-end;
+            }
+
+
+        .subscriptions-export-links{
+            margin: 0px 0px 0px 20px;
+            background-color: #dadada;
+            list-style: none;
+            max-width: 300px;
+            padding:10px;
+        }
+
+    .sub-list-controls{
+        background-color: #dadada;
+        padding:10px;
+    }
+
+
+    .tag-group-list{
+        list-style: none;
+        margin-left: 10px;
+        margin-right: 10px;
+        padding: 0px;
+    }
+        .tag-group{
+            border-style: solid;
+            margin-bottom: 10px;
+        }
+
+    .sub-list{
+        list-style: none;
+        padding:10px;
+        column-width: 300px;
+        column-gap: 40px;
+    }
+        .sub-list-item{
+            display:flex;
+            margin-bottom: 10px;
+            background-color: #dadada;
+        }
+            .tag-list{
+                margin-left:15px;
+                font-weight:bold;
+            }
+            .sub-list-item-name{
+                margin-left:15px;
+            }
+            .sub-list-checkbox{
+                height: 1.5em;
+                width: 1.5em;
+            }
+        .muted{
+            background-color: #888888;
+        }
+{% endblock style %}
+
+
+{% macro subscription_list(sub_list) %}
+    {% for subscription in sub_list %}
+        <li class="sub-list-item {{ 'muted' if subscription['muted'] else '' }}">
+            <input class="sub-list-checkbox" name="channel_ids" value="{{ subscription['channel_id'] }}" form="subscription-manager-form" type="checkbox">
+            <a href="{{ subscription['channel_url'] }}" class="sub-list-item-name" title="{{ subscription['channel_name'] }}">{{ subscription['channel_name'] }}</a>
+            <span class="tag-list">{{ ', '.join(subscription['tags']) }}</span>
+        </li>
+    {% endfor %}
+{% endmacro %}
+
+
+
+{% block main %}
+    <div class="import-export">
+        <form class="subscriptions-import-form" enctype="multipart/form-data" action="/youtube.com/import_subscriptions" method="POST">
+            <h2>Import subscriptions</h2>
+            <input type="file" id="subscriptions-import" accept="application/json, application/xml, text/x-opml" name="subscriptions_file">
+            <input type="submit" value="Import" class="import-submit-button">
+        </form>
+
+        <ul class="subscriptions-export-links">
+            <li><a href="/youtube.com/subscriptions.opml">Export subscriptions (OPML)</a></li>
+            <li><a href="/youtube.com/subscriptions.xml">Export subscriptions (RSS)</a></li>
+        </ul>
+    </div>
+
+    <hr>
+
+    <form id="subscription-manager-form" class="sub-list-controls" method="POST">
+        {% if group_by_tags %}
+            <a class="sort-button" href="/https://www.youtube.com/subscription_manager?group_by_tags=0">Don't group</a>
+        {% else %}
+            <a class="sort-button" href="/https://www.youtube.com/subscription_manager?group_by_tags=1">Group by tags</a>
+        {% endif %}
+        <input type="text" name="tags">
+        <button type="submit" name="action" value="add_tags">Add tags</button>
+        <button type="submit" name="action" value="remove_tags">Remove tags</button>
+        <button type="submit" name="action" value="unsubscribe_verify">Unsubscribe</button>
+        <button type="submit" name="action" value="mute">Mute</button>
+        <button type="submit" name="action" value="unmute">Unmute</button>
+        <input type="reset" value="Clear Selection">
+    </form>
+
+
+    {% if group_by_tags %}
+        <ul class="tag-group-list">
+            {% for tag_name, sub_list in tag_groups %}
+                <li class="tag-group">
+                    <h2 class="tag-group-name">{{ tag_name }}</h2>
+                    <ol class="sub-list">
+                        {{ subscription_list(sub_list) }}
+                    </ol>
+                </li>
+            {% endfor %}
+        </ul>
+    {% else %}
+        <ol class="sub-list">
+            {{ subscription_list(sub_list) }}
+        </ol>
+    {% endif %}
+
+{% endblock main %}
diff --git a/youtube/templates/unsubscribe_verify.html b/youtube/templates/unsubscribe_verify.html
new file mode 100644
index 0000000..98581c0
--- /dev/null
+++ b/youtube/templates/unsubscribe_verify.html
@@ -0,0 +1,19 @@
+{% set page_title = 'Unsubscribe?' %}
+{% extends "base.html" %}
+
+{% block main %}
+    <span>Are you sure you want to unsubscribe from these channels?</span>
+    <form class="subscriptions-import-form" action="/youtube.com/subscription_manager" method="POST">
+        {% for channel_id, channel_name in unsubscribe_list %}
+            <input type="hidden" name="channel_ids" value="{{ channel_id }}">
+        {% endfor %}
+
+        <input type="hidden" name="action" value="unsubscribe">
+        <input type="submit" value="Yes, unsubscribe">
+    </form>
+    <ul>
+        {% for channel_id, channel_name in unsubscribe_list %}
+            <li><a href="{{ '/https://www.youtube.com/channel/' + channel_id }}" title="{{ channel_name }}">{{ channel_name }}</a></li>
+        {% endfor %}
+    </ul>
+{% endblock main %}
-- 
cgit v1.2.3


From 2617f87e17b94646eb5a248360a7e0f9b7675d3e Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 10 Aug 2019 18:12:02 -0700
Subject: Add subscribe button on channels

---
 youtube/channel.py             | 6 +++---
 youtube/subscriptions.py       | 2 +-
 youtube/templates/channel.html | 9 +++++++++
 3 files changed, 13 insertions(+), 4 deletions(-)

(limited to 'youtube')

diff --git a/youtube/channel.py b/youtube/channel.py
index 4c7d380..9d0532a 100644
--- a/youtube/channel.py
+++ b/youtube/channel.py
@@ -1,5 +1,5 @@
 import base64
-from youtube import util, yt_data_extract, local_playlist
+from youtube import util, yt_data_extract, local_playlist, subscriptions
 from youtube import yt_app
 
 import urllib
@@ -312,7 +312,7 @@ def get_channel_page(channel_id, tab='videos'):
         info['current_sort'] = sort
     elif tab == 'search':
         info['search_box_value'] = query
-
+    info['subscribed'] = subscriptions.is_subscribed(info['channel_id'])
 
     return flask.render_template('channel.html',
         parameters_dictionary = request.args,
@@ -352,7 +352,7 @@ def get_channel_page_general_url(base_url, tab, request):
         info['current_sort'] = sort
     elif tab == 'search':
         info['search_box_value'] = query
-
+    info['subscribed'] = subscriptions.is_subscribed(info['channel_id'])
 
     return flask.render_template('channel.html',
         parameters_dictionary = request.args,
diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index fa0570c..c347e76 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -519,7 +519,7 @@ def get_subscriptions_page():
 def post_subscriptions_page():
     action = request.values['action']
     if action == 'subscribe':
-        if len(request.values.getlist('channel_id')) != len(request.values('channel_name')):
+        if len(request.values.getlist('channel_id')) != len(request.values.getlist('channel_name')):
             return '400 Bad Request, length of channel_id != length of channel_name', 400
         with_open_db(_subscribe, zip(request.values.getlist('channel_id'), request.values.getlist('channel_name')))
 
diff --git a/youtube/templates/channel.html b/youtube/templates/channel.html
index 069e33b..a9f3ac9 100644
--- a/youtube/templates/channel.html
+++ b/youtube/templates/channel.html
@@ -23,6 +23,9 @@
             grid-column:2;
             margin-left: 5px;
         }
+            .summary .subscribe-unsubscribe, .summary .short-description{
+                margin-top: 10px;
+            }
         main .channel-tabs{
             grid-row:2;
             grid-column: 1 / span 2;
@@ -90,6 +93,12 @@
     <div class="summary">
         <h2 class="title">{{ channel_name }}</h2>
         <p class="short-description">{{ short_description }}</p>
+        <form method="POST" action="/youtube.com/subscriptions" class="subscribe-unsubscribe">
+            <input type="submit" value="{{ 'Unsubscribe' if subscribed else 'Subscribe' }}">
+            <input type="hidden" name="channel_id" value="{{ channel_id }}">
+            <input type="hidden" name="channel_name" value="{{ channel_name }}">
+            <input type="hidden" name="action" value="{{ 'unsubscribe' if subscribed else 'subscribe' }}">
+        </form>
     </div>
     <nav class="channel-tabs">
         {% for tab_name in ('Videos', 'Playlists', 'About') %}
-- 
cgit v1.2.3


From 525ec403c0d083eecae9727a0048ad9074c06e04 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 11 Aug 2019 17:09:38 -0700
Subject: Download and save subscription thumbnails when requested by the
 browser, not preemptively

---
 youtube/subscriptions.py | 67 +++++++++++++++++++++++-------------------------
 1 file changed, 32 insertions(+), 35 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index c347e76..b29bf87 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -10,6 +10,7 @@ import json
 import traceback
 import contextlib
 import defusedxml.ElementTree
+import urllib
 
 import flask
 from flask import request
@@ -205,31 +206,12 @@ except FileNotFoundError:
     existing_thumbnails = set()
 
 
-thumbnails_queue = util.RateLimitedQueue()
 check_channels_queue = util.RateLimitedQueue()
-
-
-# Use this to mark a thumbnail acceptable to be retrieved at the request of the browser
-# can't simply check if it's in the queue because items are removed when the download starts, not when it finishes
-downloading_thumbnails = set()
-
 checking_channels = set()
 
 # Just to use for printing channel checking status to console without opening database
 channel_names = dict()
 
-def download_thumbnail_worker():
-    while True:
-        video_id = thumbnails_queue.get()
-        try:
-            success = util.download_thumbnail(thumbnails_directory, video_id)
-            if success:
-                existing_thumbnails.add(video_id)
-        except Exception:
-            traceback.print_exc()
-        finally:
-            downloading_thumbnails.remove(video_id)
-
 def check_channel_worker():
     while True:
         channel_id = check_channels_queue.get()
@@ -239,20 +221,12 @@ def check_channel_worker():
             checking_channels.remove(channel_id)
 
 for i in range(0,5):
-    gevent.spawn(download_thumbnail_worker)
     gevent.spawn(check_channel_worker)
 
 
-
-def download_thumbnails_if_necessary(thumbnails):
-    for video_id in thumbnails:
-        if video_id not in existing_thumbnails and video_id not in downloading_thumbnails:
-            downloading_thumbnails.add(video_id)
-            thumbnails_queue.put(video_id)
-
 def check_channels_if_necessary(channel_ids):
     for channel_id in channel_ids:
         if channel_id not in checking_channels:
@@ -279,8 +253,6 @@ def _get_upstream_videos(channel_id):
             print(video_item)
         videos.append((channel_id, video_item['id'], video_item['title'], video_item['duration'], video_item['time_published'], video_item['description']))
 
-    now = time.time()
-    download_thumbnails_if_necessary(video[1] for video in videos if (now - video[4]) < 30*24*3600) # Don't download thumbnails from videos older than a month
 
     with open_database() as connection:
         with connection as cursor:
@@ -488,10 +460,7 @@ def get_subscriptions_page():
         with connection as cursor:
             videos = []
             for video in _get_videos(cursor, 60, 0):
-                if video['id'] in downloading_thumbnails:
-                    video['thumbnail'] = util.get_thumbnail_url(video['id'])
-                else:
-                    video['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + video['id'] + '.jpg'
+                video['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + video['id'] + '.jpg'
                 video['type'] = 'video'
                 video['item_size'] = 'small'
                 videos.append(video)
@@ -544,6 +513,34 @@ def post_subscriptions_page():
 
 @yt_app.route('/data/subscription_thumbnails/<thumbnail>')
 def serve_subscription_thumbnail(thumbnail):
-    # .. is necessary because flask always uses the application directory at ./youtube, not the working directory
-    return flask.send_from_directory(os.path.join('..', thumbnails_directory), thumbnail)
+    assert thumbnail[-4:] == '.jpg'
+    video_id = thumbnail[0:-4]
+    thumbnail_path = os.path.join(thumbnails_directory, thumbnail)
+
+    if video_id in existing_thumbnails:
+        # .. is necessary because flask always uses the application directory at ./youtube, not the working directory
+        return flask.send_from_directory(os.path.join('..', thumbnails_directory), thumbnail)
+    else:
+        url = "https://i.ytimg.com/vi/" + video_id + "/mqdefault.jpg"
+        try:
+            image = util.fetch_url(url, report_text="Saved thumbnail: " + video_id)
+        except urllib.error.HTTPError as e:
+            print("Failed to download thumbnail for " + video_id + ": " + str(e))
+            abort(e.code)
+        try:
+            f = open(thumbnail_path, 'wb')
+        except FileNotFoundError:
+            os.makedirs(thumbnail_path, exist_ok = True)
+            f = open(thumbnail_path, 'wb')
+        f.write(image)
+        f.close()
+        existing_thumbnails.add(video_id)
+
+        return flask.Response(image, mimetype='image/jpeg')
+
+
+
+
+
+
 
-- 
cgit v1.2.3


From 42036f92d25ec8f0a94e4f3af41c0977eca1274a Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 11 Aug 2019 17:25:10 -0700
Subject: Delete thumbnails from channel when unsubscribing

---
 youtube/subscriptions.py | 25 ++++++++++++++++++++++++-
 1 file changed, 24 insertions(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index b29bf87..3a0ef49 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -92,9 +92,32 @@ def _subscribe(cursor, channels):
     cursor.executemany('''INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked)
                           VALUES (?, ?, ?)''', channels)
 
-# TODO: delete thumbnails
+
+def delete_thumbnails(to_delete):
+    for thumbnail in to_delete:
+        try:
+            video_id = thumbnail[0:-4]
+            if video_id in existing_thumbnails:
+                os.remove(os.path.join(thumbnails_directory, thumbnail))
+                existing_thumbnails.remove(video_id)
+        except Exception:
+            print('Failed to delete thumbnail: ' + thumbnail)
+            traceback.print_exc()
+
 def _unsubscribe(cursor, channel_ids):
     ''' channel_ids is a list of channel_ids '''
+    to_delete = []
+    for channel_id in channel_ids:
+        rows = cursor.execute('''SELECT video_id
+                                 FROM videos
+                                 WHERE sql_channel_id = (
+                                     SELECT id
+                                     FROM subscribed_channels
+                                     WHERE yt_channel_id=?
+                                 )''', (channel_id,)).fetchall()
+        to_delete += [row[0] + '.jpg' for row in rows]
+
+    gevent.spawn(delete_thumbnails, to_delete)
     cursor.executemany("DELETE FROM subscribed_channels WHERE yt_channel_id=?", ((channel_id, ) for channel_id in channel_ids))
 
 def _get_videos(cursor, number, offset):
-- 
cgit v1.2.3


From 5a6c65774bf44ce4b2dadf3523a9125aa851561a Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 11 Aug 2019 17:27:55 -0700
Subject: Fix bug where the first downloaded thumbnail is made a directory
 when the thumbnail directory doesn't exist

---
 youtube/subscriptions.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 3a0ef49..8937a96 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -553,7 +553,7 @@ def serve_subscription_thumbnail(thumbnail):
         try:
             f = open(thumbnail_path, 'wb')
         except FileNotFoundError:
-            os.makedirs(thumbnail_path, exist_ok = True)
+            os.makedirs(thumbnails_directory, exist_ok = True)
             f = open(thumbnail_path, 'wb')
         f.write(image)
         f.close()
-- 
cgit v1.2.3


From a12b73439a5d81ea4052ec33177fc5a61124017e Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 11 Aug 2019 17:37:42 -0700
Subject: If thumbnail or thumbnail directory is deleted after having been
 downloaded, correctly detect it and redownload it

---
 youtube/subscriptions.py | 39 +++++++++++++++++++++++----------------
 1 file changed, 23 insertions(+), 16 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 8937a96..9016844 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -536,30 +536,37 @@ def post_subscriptions_page():
 
 @yt_app.route('/data/subscription_thumbnails/<thumbnail>')
 def serve_subscription_thumbnail(thumbnail):
+    '''Serves thumbnail from disk if it's been saved already. If not, downloads the thumbnail, saves to disk, and serves it.'''
     assert thumbnail[-4:] == '.jpg'
     video_id = thumbnail[0:-4]
     thumbnail_path = os.path.join(thumbnails_directory, thumbnail)
 
     if video_id in existing_thumbnails:
-        # .. is necessary because flask always uses the application directory at ./youtube, not the working directory
-        return flask.send_from_directory(os.path.join('..', thumbnails_directory), thumbnail)
-    else:
-        url = "https://i.ytimg.com/vi/" + video_id + "/mqdefault.jpg"
-        try:
-            image = util.fetch_url(url, report_text="Saved thumbnail: " + video_id)
-        except urllib.error.HTTPError as e:
-            print("Failed to download thumbnail for " + video_id + ": " + str(e))
-            abort(e.code)
         try:
-            f = open(thumbnail_path, 'wb')
+            f = open(thumbnail_path, 'rb')
         except FileNotFoundError:
-            os.makedirs(thumbnails_directory, exist_ok = True)
-            f = open(thumbnail_path, 'wb')
-        f.write(image)
-        f.close()
-        existing_thumbnails.add(video_id)
+            existing_thumbnails.remove(video_id)
+        else:
+            image = f.read()
+            f.close()
+            return flask.Response(image, mimetype='image/jpeg')
 
-        return flask.Response(image, mimetype='image/jpeg')
+    url = "https://i.ytimg.com/vi/" + video_id + "/mqdefault.jpg"
+    try:
+        image = util.fetch_url(url, report_text="Saved thumbnail: " + video_id)
+    except urllib.error.HTTPError as e:
+        print("Failed to download thumbnail for " + video_id + ": " + str(e))
+        flask.abort(e.code)  # relay the upstream HTTP status to the client
+    try:
+        f = open(thumbnail_path, 'wb')
+    except FileNotFoundError:
+        os.makedirs(thumbnails_directory, exist_ok = True)
+        f = open(thumbnail_path, 'wb')
+    f.write(image)
+    f.close()
+    existing_thumbnails.add(video_id)
+
+    return flask.Response(image, mimetype='image/jpeg')
 
 
-- 
cgit v1.2.3


From d1ae8dc290e294a7f0a4d1fc485479a0236a2345 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 11 Aug 2019 17:44:11 -0700
Subject: Subscriptions flask port: add missing html info (video url and info
 dict)

---
 youtube/subscriptions.py | 1 +
 1 file changed, 1 insertion(+)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 9016844..ba1f334 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -486,6 +486,7 @@ def get_subscriptions_page():
                 video['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + video['id'] + '.jpg'
                 video['type'] = 'video'
                 video['item_size'] = 'small'
+                yt_data_extract.add_extra_html_info(video)
                 videos.append(video)
 
             tags = _get_all_tags(cursor)
-- 
cgit v1.2.3


From b469536ce6cbdcdfd966a15aa1ce45d8f5b42db9 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 11 Aug 2019 18:17:19 -0700
Subject: Ability to only show videos from channels with specific tag

---
 youtube/subscriptions.py             | 24 +++++++++++++++++-------
 youtube/templates/subscriptions.html |  2 +-
 2 files changed, 18 insertions(+), 8 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index ba1f334..3cb02ff 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -120,12 +120,21 @@ def _unsubscribe(cursor, channel_ids):
     gevent.spawn(delete_thumbnails, to_delete)
     cursor.executemany("DELETE FROM subscribed_channels WHERE yt_channel_id=?", ((channel_id, ) for channel_id in channel_ids))
 
-def _get_videos(cursor, number, offset):
-    db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
-                                  FROM videos
-                                  INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
-                                  ORDER BY time_published DESC
-                                  LIMIT ? OFFSET ?''', (number, offset))
+def _get_videos(cursor, number, offset, tag = None):
+    if tag is not None:
+        db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
+                                      FROM videos
+                                      INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
+                                      INNER JOIN tag_associations on videos.sql_channel_id = tag_associations.sql_channel_id
+                                      WHERE tag = ?
+                                      ORDER BY time_published DESC
+                                      LIMIT ? OFFSET ?''', (tag, number, offset))
+    else:
+        db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
+                                      FROM videos
+                                      INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
+                                      ORDER BY time_published DESC
+                                      LIMIT ? OFFSET ?''', (number, offset))
 
     for db_video in db_videos:
         yield {
@@ -481,8 +490,9 @@ def post_subscription_manager_page():
 def get_subscriptions_page():
     with open_database() as connection:
         with connection as cursor:
+            tag = request.args.get('tag', None)
             videos = []
-            for video in _get_videos(cursor, 60, 0):
+            for video in _get_videos(cursor, 60, 0, tag):
                 video['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + video['id'] + '.jpg'
                 video['type'] = 'video'
                 video['item_size'] = 'small'
diff --git a/youtube/templates/subscriptions.html b/youtube/templates/subscriptions.html
index a3227b1..442bd88 100644
--- a/youtube/templates/subscriptions.html
+++ b/youtube/templates/subscriptions.html
@@ -64,7 +64,7 @@
         <ol class="sidebar-list tags">
             {% for tag in tags %}
                 <li class="sidebar-list-item">
-                    <span class="sidebar-item-name">{{ tag }}</span>
+                    <a href="?tag={{ tag|urlencode }}" class="sidebar-item-name">{{ tag }}</a>
                     <form method="POST" class="sidebar-item-refresh">
                         <input type="submit" value="Check">
                         <input type="hidden" name="action" value="refresh">
-- 
cgit v1.2.3


From c55955f42d5fff886892f5d0093ee2725a911b02 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sun, 11 Aug 2019 18:36:44 -0700
Subject: Set sqlite to respect foreign key constraints

---
 youtube/subscriptions.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 3cb02ff..2c7b1fa 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -27,9 +27,10 @@ def open_database():
         os.makedirs(settings.data_dir)
     connection = sqlite3.connect(database_path, check_same_thread=False)
 
-    # Create tables if they don't exist
     try:
         cursor = connection.cursor()
+        cursor.execute('''PRAGMA foreign_keys = 1''')
+        # Create tables if they don't exist
         cursor.execute('''CREATE TABLE IF NOT EXISTS subscribed_channels (
                               id integer PRIMARY KEY,
                               yt_channel_id text UNIQUE NOT NULL,
-- 
cgit v1.2.3


From dd4841901f676fff619d9cf794c37a35e202bda6 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 12 Aug 2019 01:14:11 -0700
Subject: Add pagination to subscriptions page

---
 youtube/subscriptions.py             | 38 +++++++++++++++++++++++++++---------
 youtube/templates/subscriptions.html | 24 ++++++++++++++---------
 2 files changed, 44 insertions(+), 18 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 2c7b1fa..5a957ac 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -11,6 +11,7 @@ import traceback
 import contextlib
 import defusedxml.ElementTree
 import urllib
+import math
 
 import flask
 from flask import request
@@ -121,7 +122,16 @@ def _unsubscribe(cursor, channel_ids):
     gevent.spawn(delete_thumbnails, to_delete)
     cursor.executemany("DELETE FROM subscribed_channels WHERE yt_channel_id=?", ((channel_id, ) for channel_id in channel_ids))
 
-def _get_videos(cursor, number, offset, tag = None):
+def _get_videos(cursor, number_per_page, offset, tag = None):
+    '''Returns a full page of videos with an offset, and a value good enough to be used as the total number of videos'''
+    # We ask for the next 9 pages from the database
+    # Then the actual length of the results tell us if there are more than 9 pages left, and if not, how many there actually are
+    # This is done since there are only 9 page buttons on display at a time
+    # If there are more than 9 pages left, we give a fake value in place of the real number of results if the entire database was queried without limit
+    # This fake value is sufficient to get the page button generation macro to display 9 page buttons
+    # If we wish to display more buttons this logic must change
+    # We cannot use tricks with the sql id for the video since we frequently have filters and other restrictions in place on the results anyway
+    # TODO: This is probably not the ideal solution
     if tag is not None:
         db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
                                       FROM videos
@@ -129,21 +139,29 @@ def _get_videos(cursor, number, offset, tag = None):
                                       INNER JOIN tag_associations on videos.sql_channel_id = tag_associations.sql_channel_id
                                       WHERE tag = ?
                                       ORDER BY time_published DESC
-                                      LIMIT ? OFFSET ?''', (tag, number, offset))
+                                      LIMIT ? OFFSET ?''', (tag, number_per_page*9, offset)).fetchall()
     else:
         db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
                                       FROM videos
                                       INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
                                       ORDER BY time_published DESC
-                                      LIMIT ? OFFSET ?''', (number, offset))
+                                      LIMIT ? OFFSET ?''', (number_per_page*9, offset)).fetchall()
 
-    for db_video in db_videos:
-        yield {
+    pseudo_number_of_videos = offset + len(db_videos)
+
+    videos = []
+    for db_video in db_videos[0:number_per_page]:
+        videos.append({
             'id':   db_video[0],
             'title':    db_video[1],
             'duration': db_video[2],
             'author':   db_video[3],
-        }
+        })
+
+    return videos, pseudo_number_of_videos
+
+
+
 
 def _get_subscribed_channels(cursor):
     for item in cursor.execute('''SELECT channel_name, yt_channel_id, muted
@@ -489,16 +507,16 @@ def post_subscription_manager_page():
 @yt_app.route('/subscriptions', methods=['GET'])
 @yt_app.route('/feed/subscriptions', methods=['GET'])
 def get_subscriptions_page():
+    page = int(request.args.get('page', 1))
     with open_database() as connection:
         with connection as cursor:
             tag = request.args.get('tag', None)
-            videos = []
-            for video in _get_videos(cursor, 60, 0, tag):
+            videos, number_of_videos_in_db = _get_videos(cursor, 60, (page - 1)*60, tag)
+            for video in videos:
                 video['thumbnail'] = util.URL_ORIGIN + '/data/subscription_thumbnails/' + video['id'] + '.jpg'
                 video['type'] = 'video'
                 video['item_size'] = 'small'
                 yt_data_extract.add_extra_html_info(video)
-                videos.append(video)
 
             tags = _get_all_tags(cursor)
 
@@ -514,6 +532,8 @@ def get_subscriptions_page():
 
     return flask.render_template('subscriptions.html',
         videos = videos,
+        num_pages = math.ceil(number_of_videos_in_db/60),
+        parameters_dictionary = request.args,
         tags = tags,
         subscription_list = subscription_list,
     )
diff --git a/youtube/templates/subscriptions.html b/youtube/templates/subscriptions.html
index 442bd88..b4b87f0 100644
--- a/youtube/templates/subscriptions.html
+++ b/youtube/templates/subscriptions.html
@@ -7,9 +7,12 @@
         display:flex;
         flex-direction: row;
     }
-    .item-grid{
+    .video-section{
         flex-grow: 1;
     }
+        .video-section .page-button-row{
+            justify-content: center;
+        }
     .subscriptions-sidebar{
         flex-basis: 300px;
         background-color: #dadada;
@@ -44,11 +47,17 @@
 {% endblock style %}
 
 {% block main %}
-    <nav class="item-grid">
-        {% for video_info in videos %}
-            {{ common_elements.item(video_info, include_author=false) }}
-        {% endfor %}
-    </nav>
+    <div class="video-section">
+        <nav class="item-grid">
+            {% for video_info in videos %}
+                {{ common_elements.item(video_info, include_author=false) }}
+            {% endfor %}
+        </nav>
+
+        <nav class="page-button-row">
+            {{ common_elements.page_buttons(num_pages, '/youtube.com/subscriptions', parameters_dictionary) }}
+        </nav>
+    </div>
 
     <div class="subscriptions-sidebar">
         <div class="sidebar-links">
@@ -91,7 +100,4 @@
 
     </div>
 
-    <nav class="page-button-row">
-        {# TODO #}
-    </nav>
 {% endblock main %}
-- 
cgit v1.2.3


From de33ee6bb87aeff4bdc01a995c24515894a6a3a8 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 12 Aug 2019 15:09:28 -0700
Subject: When restricting subscriptions to a tag, make that tag unclickable
 and add link to unrestrict

---
 youtube/subscriptions.py             |  1 +
 youtube/templates/subscriptions.html | 12 +++++++++++-
 2 files changed, 12 insertions(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 5a957ac..64a72f4 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -535,6 +535,7 @@ def get_subscriptions_page():
         num_pages = math.ceil(number_of_videos_in_db/60),
         parameters_dictionary = request.args,
         tags = tags,
+        current_tag = tag,
         subscription_list = subscription_list,
     )
 
diff --git a/youtube/templates/subscriptions.html b/youtube/templates/subscriptions.html
index b4b87f0..62ed681 100644
--- a/youtube/templates/subscriptions.html
+++ b/youtube/templates/subscriptions.html
@@ -71,9 +71,19 @@
 
         <hr>
         <ol class="sidebar-list tags">
+            {% if current_tag %}
+                <li class="sidebar-list-item">
+                    <a href="/youtube.com/subscriptions" class="sidebar-item-name">Any tag</a>
+                </li>
+            {% endif %}
+
             {% for tag in tags %}
                 <li class="sidebar-list-item">
-                    <a href="?tag={{ tag|urlencode }}" class="sidebar-item-name">{{ tag }}</a>
+                    {% if tag == current_tag %}
+                        <span class="sidebar-item-name">{{ tag }}</span>
+                    {% else %}
+                        <a href="?tag={{ tag|urlencode }}" class="sidebar-item-name">{{ tag }}</a>
+                    {% endif %}
                     <form method="POST" class="sidebar-item-refresh">
                         <input type="submit" value="Check">
                         <input type="hidden" name="action" value="refresh">
-- 
cgit v1.2.3


From da8243085b30ff44b226dd177ab8bca755e1c48b Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 12 Aug 2019 15:18:56 -0700
Subject: subscription_manager: fix bug where checkbox size decreases when
 there's too many tags

---
 youtube/templates/subscription_manager.html | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/templates/subscription_manager.html b/youtube/templates/subscription_manager.html
index 838f4af..eb52eef 100644
--- a/youtube/templates/subscription_manager.html
+++ b/youtube/templates/subscription_manager.html
@@ -69,7 +69,7 @@
             }
             .sub-list-checkbox{
                 height: 1.5em;
-                width: 1.5em;
+                min-width: 1.5em;   // need min-width otherwise browser doesn't respect the width and squishes the checkbox down when there's too many tags
             }
         .muted{
             background-color: #888888;
-- 
cgit v1.2.3


From 38792081d45d99377f5d472a31133e90a0f5d631 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 12 Aug 2019 15:34:55 -0700
Subject: subscription-manager: fix items being cut off at the bottom and top
 of the columns in chrome

---
 youtube/templates/subscription_manager.html | 1 +
 1 file changed, 1 insertion(+)

(limited to 'youtube')

diff --git a/youtube/templates/subscription_manager.html b/youtube/templates/subscription_manager.html
index eb52eef..3145f54 100644
--- a/youtube/templates/subscription_manager.html
+++ b/youtube/templates/subscription_manager.html
@@ -58,6 +58,7 @@
         .sub-list-item{
             display:flex;
             margin-bottom: 10px;
+            break-inside:avoid;
             background-color: #dadada;
         }
             .tag-list{
-- 
cgit v1.2.3


From 31a04555aeee7e9bdaf770ab8f9252990a874890 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Wed, 14 Aug 2019 00:12:24 -0700
Subject: Subscriptions auto-checking system

---
 youtube/subscriptions.py | 92 +++++++++++++++++++++++++++++++++++++++++++++---
 1 file changed, 88 insertions(+), 4 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 64a72f4..60d5531 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -12,6 +12,7 @@ import contextlib
 import defusedxml.ElementTree
 import urllib
 import math
+import secrets
 
 import flask
 from flask import request
@@ -37,8 +38,8 @@ def open_database():
                               yt_channel_id text UNIQUE NOT NULL,
                               channel_name text NOT NULL,
                               time_last_checked integer,
-                              muted integer DEFAULT 0,
-                              upload_frequency integer
+                              next_check_time integer,
+                              muted integer DEFAULT 0
                           )''')
         cursor.execute('''CREATE TABLE IF NOT EXISTS videos (
                               id integer PRIMARY KEY,
@@ -227,6 +228,11 @@ def _channels_with_tag(cursor, tag, order=False, exclude_muted=False, include_mu
 
     return cursor.execute(statement, [tag]).fetchall()
 
+def _schedule_checking(cursor, channel_id, next_check_time):
+    cursor.execute('''UPDATE subscribed_channels SET next_check_time = ? WHERE yt_channel_id = ?''', [int(next_check_time), channel_id])
+
+def _is_muted(cursor, channel_id):
+    return bool(cursor.execute('''SELECT muted FROM subscribed_channels WHERE yt_channel_id=?''', [channel_id]).fetchone()[0])
 
 units = {
     'year': 31536000,   # 365*24*3600
@@ -257,6 +263,9 @@ except FileNotFoundError:
     existing_thumbnails = set()
 
 
+# --- Manual checking system. Rate limited in order to support very large numbers of channels to be checked ---
+# Auto checking system plugs into this for convenience, though it doesn't really need the rate limiting
+
 check_channels_queue = util.RateLimitedQueue()
 checking_channels = set()
 
@@ -273,8 +282,65 @@ def check_channel_worker():
 
 for i in range(0,5):
     gevent.spawn(check_channel_worker)
+# ----------------------------
+
+
+
+# --- Auto checking system ---
+
+if settings.autocheck_subscriptions:
+    # job application format: dict with keys (channel_id, channel_name, next_check_time)
+    autocheck_job_application = gevent.queue.Queue() # only really meant to hold 1 item, just reusing gevent's wait and timeout machinery
+
+    autocheck_jobs = [] # list of dicts with the keys (channel_id, channel_name, next_check_time). Stores all the channels that need to be autochecked and when to check them
+    with open_database() as connection:
+        with connection as cursor:
+            now = time.time()
+            for row in cursor.execute('''SELECT yt_channel_id, channel_name, next_check_time FROM subscribed_channels WHERE next_check_time IS NOT NULL AND muted != 1''').fetchall():
+                if row[2] < now:    # expired, check randomly within the 30 minutes
+                    next_check_time = now + 3600*secrets.randbelow(60)/60
+                    row = (row[0], row[1], next_check_time)
+                    _schedule_checking(cursor, row[0], next_check_time)
+                autocheck_jobs.append({'channel_id': row[0], 'channel_name': row[1], 'next_check_time': row[2]})
+
+
+
+    def autocheck_dispatcher():
+        '''Scans the auto_check_list. Sleeps until the earliest job is due, then adds that channel to the checking queue above. Can be sent a new job through autocheck_job_application'''
+        while True:
+            if len(autocheck_jobs) == 0:
+                new_job = autocheck_job_application.get()
+                autocheck_jobs.append(new_job)
+            else:
+                earliest_job_index = min(range(0, len(autocheck_jobs)), key=lambda index: autocheck_jobs[index]['next_check_time']) # https://stackoverflow.com/a/11825864
+                earliest_job = autocheck_jobs[earliest_job_index]
+                time_until_earliest_job = earliest_job['next_check_time'] - time.time()
+
+                if time_until_earliest_job <= 0:
+                    print('ERROR: autocheck_dispatcher got job scheduled in the past, skipping and rescheduling: ' + earliest_job['channel_id'] + ', ' + earliest_job['channel_name'] + ', ' + str(earliest_job['next_check_time']))
+                    next_check_time = time.time() + 3600*secrets.randbelow(60)/60
+                    with_open_db(_schedule_checking, earliest_job['channel_id'], next_check_time)
+                    autocheck_jobs[earliest_job_index]['next_check_time'] = next_check_time
+                    continue
+
+                # make sure it's not muted
+                if with_open_db(_is_muted, earliest_job['channel_id']):
+                    del autocheck_jobs[earliest_job_index]
+                    continue
+
+                try:
+                    new_job = autocheck_job_application.get(timeout = time_until_earliest_job)  # sleep for time_until_earliest_job time, but allow to be interrupted by new jobs
+                except gevent.queue.Empty: # no new jobs, time to execute the earliest job
+                    channel_names[earliest_job['channel_id']] = earliest_job['channel_name']
+                    checking_channels.add(earliest_job['channel_id'])
+                    check_channels_queue.put(earliest_job['channel_id'])
+                    del autocheck_jobs[earliest_job_index]
+                else: # new job, add it to the list
+                    autocheck_jobs.append(new_job)
 
 
+    gevent.spawn(autocheck_dispatcher)
+# ----------------------------
 
 
@@ -305,13 +371,31 @@ def _get_upstream_videos(channel_id):
         videos.append((channel_id, video_item['id'], video_item['title'], video_item['duration'], video_item['time_published'], video_item['description']))
 
 
+    if len(videos) == 0:
+        average_upload_period = 4*7*24*3600 # assume 1 month for channel with no videos
+    elif len(videos) < 5:
+        average_upload_period = int((time.time() - videos[len(videos)-1][4])/len(videos))
+    else:
+        average_upload_period = int((time.time() - videos[4][4])/5) # equivalent to averaging the time between videos for the last 5 videos
+
+    # calculate when to check next for auto checking
+    # add some quantization and randomness to make pattern analysis by Youtube slightly harder
+    quantized_upload_period = average_upload_period - (average_upload_period % (4*3600)) + 4*3600   # round up to nearest 4 hours
+    randomized_upload_period = quantized_upload_period*(1 + secrets.randbelow(50)/50*0.5) # randomly between 1x and 1.5x
+    next_check_delay = randomized_upload_period/5    # check at 5x the channel posting rate. might want to fine tune this number
+    next_check_time = int(time.time() + next_check_delay)
+
     with open_database() as connection:
         with connection as cursor:
             cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, description)
                                   VALUES ((SELECT id FROM subscribed_channels WHERE yt_channel_id=?), ?, ?, ?, ?, ?)''', videos)
             cursor.execute('''UPDATE subscribed_channels
-                              SET time_last_checked = ?
-                              WHERE yt_channel_id=?''', [int(time.time()), channel_id])
+                              SET time_last_checked = ?, next_check_time = ?
+                              WHERE yt_channel_id=?''', [int(time.time()), next_check_time, channel_id])
+
+            if settings.autocheck_subscriptions:
+                if not _is_muted(cursor, channel_id):
+                    autocheck_job_application.put({'channel_id': channel_id, 'channel_name': channel_names[channel_id], 'next_check_time': next_check_time})
 
 
 def check_all_channels():
-- 
cgit v1.2.3


From e69ea5910f4e195a65940c6de2ae521e8d821c85 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Wed, 14 Aug 2019 00:14:27 -0700
Subject: subscriptions.html: Add horizontal rule between tag list and channel
 list

---
 youtube/templates/subscriptions.html | 3 +++
 1 file changed, 3 insertions(+)

(limited to 'youtube')

diff --git a/youtube/templates/subscriptions.html b/youtube/templates/subscriptions.html
index 62ed681..fa6b5bf 100644
--- a/youtube/templates/subscriptions.html
+++ b/youtube/templates/subscriptions.html
@@ -70,6 +70,7 @@
         </div>
 
         <hr>
+
         <ol class="sidebar-list tags">
             {% if current_tag %}
                 <li class="sidebar-list-item">
@@ -94,6 +95,8 @@
             {% endfor %}
         </ol>
 
+        <hr>
+
         <ol class="sidebar-list sub-refresh-list">
             {% for subscription in subscription_list %}
                 <li class="sidebar-list-item {{ 'muted' if subscription['muted'] else '' }}">
-- 
cgit v1.2.3


From e2c9081aee4730a36228998354d6568f1c206df9 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Wed, 14 Aug 2019 16:40:42 -0700
Subject: Subscriptions: double auto-check rate

---
 youtube/subscriptions.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 60d5531..27cc5c7 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -382,7 +382,7 @@ def _get_upstream_videos(channel_id):
     # add some quantization and randomness to make pattern analysis by Youtube slightly harder
     quantized_upload_period = average_upload_period - (average_upload_period % (4*3600)) + 4*3600   # round up to nearest 4 hours
     randomized_upload_period = quantized_upload_period*(1 + secrets.randbelow(50)/50*0.5) # randomly between 1x and 1.5x
-    next_check_delay = randomized_upload_period/5    # check at 5x the channel posting rate. might want to fine tune this number
+    next_check_delay = randomized_upload_period/10    # check at 10x the channel posting rate. might want to fine tune this number
     next_check_time = int(time.time() + next_check_delay)
 
     with open_database() as connection:
-- 
cgit v1.2.3


From 046d7226eaa3087159e64310bfa1b5e359cd2e93 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Wed, 14 Aug 2019 18:39:39 -0700
Subject: Subscriptions: improve checking messages, say how many new vids from
 channel

---
 youtube/channel.py       |  8 +++++---
 youtube/subscriptions.py | 34 +++++++++++++++++++++++++++++++---
 2 files changed, 36 insertions(+), 6 deletions(-)

(limited to 'youtube')

diff --git a/youtube/channel.py b/youtube/channel.py
index 9d0532a..de75eaa 100644
--- a/youtube/channel.py
+++ b/youtube/channel.py
@@ -83,13 +83,15 @@ def channel_ctoken(channel_id, page, sort, tab, view=1):
 
     return base64.urlsafe_b64encode(pointless_nest).decode('ascii')
 
-def get_channel_tab(channel_id, page="1", sort=3, tab='videos', view=1):
+def get_channel_tab(channel_id, page="1", sort=3, tab='videos', view=1, print_status=True):
     ctoken = channel_ctoken(channel_id, page, sort, tab, view).replace('=', '%3D')
     url = "https://www.youtube.com/browse_ajax?ctoken=" + ctoken
 
-    print("Sending channel tab ajax request")
+    if print_status:
+        print("Sending channel tab ajax request")
     content = util.fetch_url(url, util.desktop_ua + headers_1, debug_name='channel_tab')
-    print("Finished recieving channel tab response")
+    if print_status:
+        print("Finished recieving channel tab response")
 
     return content
 
diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 27cc5c7..739b2c5 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -354,13 +354,15 @@ def check_channels_if_necessary(channel_ids):
 
 def _get_upstream_videos(channel_id):
     try:
-        print("Checking channel: " + channel_names[channel_id])
+        channel_status_name = channel_names[channel_id]
     except KeyError:
-        print("Checking channel " + channel_id)
+        channel_status_name = channel_id
+
+    print("Checking channel: " + channel_status_name)
 
     videos = []
 
-    channel_videos = channel.extract_info(json.loads(channel.get_channel_tab(channel_id)), 'videos')['items']
+    channel_videos = channel.extract_info(json.loads(channel.get_channel_tab(channel_id, print_status=False)), 'videos')['items']
     for i, video_item in enumerate(channel_videos):
         if 'description' not in video_item:
             video_item['description'] = ''
@@ -387,6 +389,24 @@ def _get_upstream_videos(channel_id):
 
     with open_database() as connection:
         with connection as cursor:
+            # calculate how many new videos there are
+            row = cursor.execute('''SELECT video_id
+                                    FROM videos
+                                    INNER JOIN subscribed_channels ON videos.sql_channel_id = subscribed_channels.id
+                                    WHERE yt_channel_id=?
+                                    ORDER BY time_published DESC
+                                    LIMIT 1''', [channel_id]).fetchone()
+            if row is None:
+                number_of_new_videos = len(videos)
+            else:
+                latest_video_id = row[0]
+                index = 0
+                for video in videos:
+                    if video[1] == latest_video_id:
+                        break
+                    index += 1
+                number_of_new_videos = index
+
             cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, description)
                                   VALUES ((SELECT id FROM subscribed_channels WHERE yt_channel_id=?), ?, ?, ?, ?, ?)''', videos)
             cursor.execute('''UPDATE subscribed_channels
@@ -397,6 +417,14 @@ def _get_upstream_videos(channel_id):
                 if not _is_muted(cursor, channel_id):
                     autocheck_job_application.put({'channel_id': channel_id, 'channel_name': channel_names[channel_id], 'next_check_time': next_check_time})
 
+    if number_of_new_videos == 0:
+        print('No new videos from ' + channel_status_name)
+    elif number_of_new_videos == 1:
+        print('1 new video from ' + channel_status_name)
+    else:
+        print(str(number_of_new_videos) + ' new videos from ' + channel_status_name)
+
+
 
 def check_all_channels():
     with open_database() as connection:
-- 
cgit v1.2.3


From 899b088cdcbfea988d79b38116d658096eafdc8b Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Fri, 16 Aug 2019 21:48:40 -0700
Subject: Subscriptions: show when video was published

---
 youtube/subscriptions.py               | 53 ++++++++++++++++++++++++----------
 youtube/templates/common_elements.html |  4 ++-
 2 files changed, 41 insertions(+), 16 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 739b2c5..4281dde 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -13,6 +13,7 @@ import defusedxml.ElementTree
 import urllib
 import math
 import secrets
+import collections
 
 import flask
 from flask import request
@@ -48,6 +49,7 @@ def open_database():
                               title text NOT NULL,
                               duration text,
                               time_published integer NOT NULL,
+                              is_time_published_exact integer DEFAULT 0,
                               description text
                           )''')
         cursor.execute('''CREATE TABLE IF NOT EXISTS tag_associations (
@@ -134,7 +136,7 @@ def _get_videos(cursor, number_per_page, offset, tag = None):
     # We cannot use tricks with the sql id for the video since we frequently have filters and other restrictions in place on the results anyway
     # TODO: This is probably not the ideal solution
     if tag is not None:
-        db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
+        db_videos = cursor.execute('''SELECT video_id, title, duration, time_published, is_time_published_exact, channel_name
                                       FROM videos
                                       INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
                                       INNER JOIN tag_associations on videos.sql_channel_id = tag_associations.sql_channel_id
@@ -142,7 +144,7 @@ def _get_videos(cursor, number_per_page, offset, tag = None):
                                       ORDER BY time_published DESC
                                       LIMIT ? OFFSET ?''', (tag, number_per_page*9, offset)).fetchall()
     else:
-        db_videos = cursor.execute('''SELECT video_id, title, duration, channel_name
+        db_videos = cursor.execute('''SELECT video_id, title, duration, time_published, is_time_published_exact, channel_name
                                       FROM videos
                                       INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
                                       ORDER BY time_published DESC
@@ -156,7 +158,8 @@ def _get_videos(cursor, number_per_page, offset, tag = None):
             'id':   db_video[0],
             'title':    db_video[1],
             'duration': db_video[2],
-            'author':   db_video[3],
+            'published': exact_timestamp(db_video[3]) if db_video[4] else posix_to_dumbed_down(db_video[3]),
+            'author':   db_video[5],
         })
 
     return videos, pseudo_number_of_videos
@@ -234,15 +237,15 @@ def _schedule_checking(cursor, channel_id, next_check_time):
 def _is_muted(cursor, channel_id):
     return bool(cursor.execute('''SELECT muted FROM subscribed_channels WHERE yt_channel_id=?''', [channel_id]).fetchone()[0])
 
-units = {
-    'year': 31536000,   # 365*24*3600
-    'month': 2592000,   # 30*24*3600
-    'week': 604800,     # 7*24*3600
-    'day':  86400,      # 24*3600
-    'hour': 3600,
-    'minute': 60,
-    'second': 1,
-}
+units = collections.OrderedDict([
+    ('year', 31536000),   # 365*24*3600
+    ('month', 2592000),   # 30*24*3600
+    ('week', 604800),     # 7*24*3600
+    ('day',  86400),      # 24*3600
+    ('hour', 3600),
+    ('minute', 60),
+    ('second', 1),
+])
 def youtube_timestamp_to_posix(dumb_timestamp):
     ''' Given a dumbed down timestamp such as 1 year ago, 3 hours ago,
          approximates the unix time (seconds since 1/1/1970) '''
@@ -251,11 +254,31 @@ def youtube_timestamp_to_posix(dumb_timestamp):
     if dumb_timestamp == "just now":
         return now
     split = dumb_timestamp.split(' ')
-    number, unit = int(split[0]), split[1]
-    if number > 1:
+    quantifier, unit = int(split[0]), split[1]
+    if quantifier > 1:
         unit = unit[:-1]    # remove s from end
-    return now - number*units[unit]
+    return now - quantifier*units[unit]
 
+def posix_to_dumbed_down(posix_time):
+    '''Inverse of youtube_timestamp_to_posix.'''
+    delta = int(time.time() - posix_time)
+    assert delta >= 0
+
+    if delta == 0:
+        return '0 seconds ago'
+
+    for unit_name, unit_time in units.items():
+        if delta >= unit_time:
+            quantifier = round(delta/unit_time)
+            if quantifier == 1:
+                return '1 ' + unit_name + ' ago'
+            else:
+                return str(quantifier) + ' ' + unit_name + 's ago'
+    else:
+        raise Exception()
+
+def exact_timestamp(posix_time):
+    return time.strftime('%m/%d/%y %I:%M %p', time.localtime(posix_time))
 
 try:
     existing_thumbnails = set(os.path.splitext(name)[0] for name in os.listdir(thumbnails_directory))
diff --git a/youtube/templates/common_elements.html b/youtube/templates/common_elements.html
index 49e2fad..b8f5c51 100644
--- a/youtube/templates/common_elements.html
+++ b/youtube/templates/common_elements.html
@@ -26,7 +26,9 @@
                 
                 <address>{{ info['author'] }}</address>
                 <span class="views">{{ info['views'] }}</span>
-
+                {% if 'views' is not in(info) and 'published' is in(info) %}
+                    <time>{{ info['published'] }}</time>
+                {% endif %}
             {% elif info['type'] == 'playlist' %}
                 <a class="playlist-thumbnail-box" href="{{ info['url'] }}" title="{{ info['title'] }}">
                     <img class="playlist-thumbnail-img" src="{{ info['thumbnail'] }}">
-- 
cgit v1.2.3


From 056f6fd2b5c4d6e4f387a73be1bd7c0207f834b3 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 17 Aug 2019 00:50:58 -0700
Subject: Subscriptions: check channel's atom feed to get exact time published

---
 youtube/subscriptions.py | 71 ++++++++++++++++++++++++++++++++++++++++++------
 1 file changed, 62 insertions(+), 9 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 4281dde..6150afe 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -14,6 +14,7 @@ import urllib
 import math
 import secrets
 import collections
+import calendar # bullshit! https://bugs.python.org/issue6280
 
 import flask
 from flask import request
@@ -278,7 +279,10 @@ def posix_to_dumbed_down(posix_time):
         raise Exception()
 
 def exact_timestamp(posix_time):
-    return time.strftime('%m/%d/%y %I:%M %p', time.localtime(posix_time))
+    result = time.strftime('%I:%M %p %m/%d/%y', time.localtime(posix_time))
+    if result[0] == '0':    # remove 0 infront of hour (like 01:00 PM)
+        return result[1:]
+    return result
 
 try:
     existing_thumbnails = set(os.path.splitext(name)[0] for name in os.listdir(thumbnails_directory))
@@ -385,15 +389,64 @@ def _get_upstream_videos(channel_id):
 
     videos = []
 
-    channel_videos = channel.extract_info(json.loads(channel.get_channel_tab(channel_id, print_status=False)), 'videos')['items']
+    tasks = (
+        gevent.spawn(channel.get_channel_tab, channel_id, print_status=False), # channel page, need for video duration
+        gevent.spawn(util.fetch_url, 'https://www.youtube.com/feeds/videos.xml?channel_id=' + channel_id) # atoma feed, need for exact published time
+    )
+    gevent.joinall(tasks)
+
+    channel_tab, feed = tasks[0].value, tasks[1].value
+
+    # extract published times from atoma feed
+    times_published = {}
+    try:
+        def remove_bullshit(tag):
+            '''Remove XML namespace bullshit from tagname. https://bugs.python.org/issue18304'''
+            if '}' in tag:
+                return tag[tag.rfind('}')+1:]
+            return tag
+
+        def find_element(base, tag_name):
+            for element in base:
+                if remove_bullshit(element.tag) == tag_name:
+                    return element
+            return None
+
+        root = defusedxml.ElementTree.fromstring(feed.decode('utf-8'))
+        assert remove_bullshit(root.tag) == 'feed'
+        for entry in root:
+            if (remove_bullshit(entry.tag) != 'entry'):
+                continue
+
+            # it's yt:videoId in the xml but the yt: is turned into a namespace which is removed by remove_bullshit
+            video_id_element = find_element(entry, 'videoId')
+            time_published_element = find_element(entry, 'published')
+            assert video_id_element is not None
+            assert time_published_element is not None
+
+            time_published = int(calendar.timegm(time.strptime(time_published_element.text, '%Y-%m-%dT%H:%M:%S+00:00')))
+            times_published[video_id_element.text] = time_published
+
+    except (AssertionError, defusedxml.ElementTree.ParseError) as e:
+        print('Failed to read atoma feed for ' + channel_status_name)
+        traceback.print_exc()
+
+
+    channel_videos = channel.extract_info(json.loads(channel_tab), 'videos')['items']
     for i, video_item in enumerate(channel_videos):
         if 'description' not in video_item:
             video_item['description'] = ''
-        try:
-            video_item['time_published'] = youtube_timestamp_to_posix(video_item['published']) - i  # subtract a few seconds off the videos so they will be in the right order
-        except KeyError:
-            print(video_item)
-        videos.append((channel_id, video_item['id'], video_item['title'], video_item['duration'], video_item['time_published'], video_item['description']))
+
+        if video_item['id'] in times_published:
+            video_item['time_published'] = times_published[video_item['id']]
+            video_item['is_time_published_exact'] = True
+        else:
+            video_item['is_time_published_exact'] = False
+            try:
+                video_item['time_published'] = youtube_timestamp_to_posix(video_item['published']) - i  # subtract a few seconds off the videos so they will be in the right order
+            except KeyError:
+                print(video_item)
+        videos.append((channel_id, video_item['id'], video_item['title'], video_item['duration'], video_item['time_published'], video_item['is_time_published_exact'], video_item['description']))
 
 
     if len(videos) == 0:
@@ -430,8 +483,8 @@ def _get_upstream_videos(channel_id):
                     index += 1
                 number_of_new_videos = index
 
-            cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, description)
-                                  VALUES ((SELECT id FROM subscribed_channels WHERE yt_channel_id=?), ?, ?, ?, ?, ?)''', videos)
+            cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, is_time_published_exact, description)
+                                  VALUES ((SELECT id FROM subscribed_channels WHERE yt_channel_id=?), ?, ?, ?, ?, ?, ?)''', videos)
             cursor.execute('''UPDATE subscribed_channels
                               SET time_last_checked = ?, next_check_time = ?
                               WHERE yt_channel_id=?''', [int(time.time()), next_check_time, channel_id])
-- 
cgit v1.2.3


From 897755e836f5ac043a683ac44e9f047184b63f6e Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 17 Aug 2019 12:49:36 -0700
Subject: Subscriptions: Add database version

---
 youtube/subscriptions.py | 3 +++
 1 file changed, 3 insertions(+)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 6150afe..26958d0 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -59,6 +59,9 @@ def open_database():
                               sql_channel_id integer NOT NULL REFERENCES subscribed_channels(id) ON UPDATE CASCADE ON DELETE CASCADE,
                               UNIQUE(tag, sql_channel_id)
                           )''')
+        cursor.execute('''CREATE TABLE IF NOT EXISTS db_info (
+                              version integer DEFAULT 1
+                          )''')
 
         connection.commit()
     except:
-- 
cgit v1.2.3


From aa5b9efca11f4fe52f176f378bd6ed96290ad9d0 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 17 Aug 2019 12:54:03 -0700
Subject: Subscriptions: Don't show videos from muted channels

---
 youtube/subscriptions.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 26958d0..a4fef5a 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -144,13 +144,14 @@ def _get_videos(cursor, number_per_page, offset, tag = None):
                                       FROM videos
                                       INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
                                       INNER JOIN tag_associations on videos.sql_channel_id = tag_associations.sql_channel_id
-                                      WHERE tag = ?
+                                      WHERE tag = ? AND muted = 0
                                       ORDER BY time_published DESC
                                       LIMIT ? OFFSET ?''', (tag, number_per_page*9, offset)).fetchall()
     else:
         db_videos = cursor.execute('''SELECT video_id, title, duration, time_published, is_time_published_exact, channel_name
                                       FROM videos
                                       INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
+                                      WHERE muted = 0
                                       ORDER BY time_published DESC
                                       LIMIT ? OFFSET ?''', (number_per_page*9, offset)).fetchall()
 
-- 
cgit v1.2.3


From d80a8b1c3f691b2cc488a6995035a1aef8590d46 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 17 Aug 2019 13:52:32 -0700
Subject: Subscriptions: Hopefully fix autochecking being scheduled in the past

---
 youtube/subscriptions.py | 32 ++++++++++++++++++++------------
 1 file changed, 20 insertions(+), 12 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index a4fef5a..93767b7 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -317,7 +317,7 @@ for i in range(0,5):
 
 
-# --- Auto checking system ---
+# --- Auto checking system - Spaghetti code ---
 
 if settings.autocheck_subscriptions:
     # job application format: dict with keys (channel_id, channel_name, next_check_time)
@@ -328,7 +328,10 @@ if settings.autocheck_subscriptions:
         with connection as cursor:
             now = time.time()
             for row in cursor.execute('''SELECT yt_channel_id, channel_name, next_check_time FROM subscribed_channels WHERE next_check_time IS NOT NULL AND muted != 1''').fetchall():
-                if row[2] < now:    # expired, check randomly within the 30 minutes
+
+                # expired, check randomly within the 30 minutes
+                # note: even if it isn't scheduled in the past right now, it might end up being if it's due soon and we dont start dispatching by then, see below where time_until_earliest_job is negative
+                if row[2] < now:
                     next_check_time = now + 3600*secrets.randbelow(60)/60
                     row = (row[0], row[1], next_check_time)
                     _schedule_checking(cursor, row[0], next_check_time)
@@ -347,7 +350,7 @@ if settings.autocheck_subscriptions:
                 earliest_job = autocheck_jobs[earliest_job_index]
                 time_until_earliest_job = earliest_job['next_check_time'] - time.time()
 
-                if time_until_earliest_job <= 0:
+                if time_until_earliest_job <= -5:   # should not happen unless we're running extremely slow
                     print('ERROR: autocheck_dispatcher got job scheduled in the past, skipping and rescheduling: ' + earliest_job['channel_id'] + ', ' + earliest_job['channel_name'] + ', ' + str(earliest_job['next_check_time']))
                     next_check_time = time.time() + 3600*secrets.randbelow(60)/60
                     with_open_db(_schedule_checking, earliest_job['channel_id'], next_check_time)
@@ -359,15 +362,20 @@ if settings.autocheck_subscriptions:
                     del autocheck_jobs[earliest_job_index]
                     continue
 
-                try:
-                    new_job = autocheck_job_application.get(timeout = time_until_earliest_job)  # sleep for time_until_earliest_job time, but allow to be interrupted by new jobs
-                except gevent.queue.Empty: # no new jobs, time to execute the earliest job
-                    channel_names[earliest_job['channel_id']] = earliest_job['channel_name']
-                    checking_channels.add(earliest_job['channel_id'])
-                    check_channels_queue.put(earliest_job['channel_id'])
-                    del autocheck_jobs[earliest_job_index]
-                else: # new job, add it to the list
-                    autocheck_jobs.append(new_job)
+                if time_until_earliest_job > 0: # it can become less than zero (in the past) when it's set to go off while the dispatcher is doing something else at that moment
+                    try:
+                        new_job = autocheck_job_application.get(timeout = time_until_earliest_job)  # sleep for time_until_earliest_job time, but allow to be interrupted by new jobs
+                    except gevent.queue.Empty: # no new jobs
+                        pass
+                    else: # new job, add it to the list
+                        autocheck_jobs.append(new_job)
+                        continue
+
+                # no new jobs, time to execute the earliest job
+                channel_names[earliest_job['channel_id']] = earliest_job['channel_name']
+                checking_channels.add(earliest_job['channel_id'])
+                check_channels_queue.put(earliest_job['channel_id'])
+                del autocheck_jobs[earliest_job_index]
 
 
     gevent.spawn(autocheck_dispatcher)
-- 
cgit v1.2.3


From 71632a23f51025a17b3edf19979b2b40d46a2631 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Sat, 17 Aug 2019 13:54:54 -0700
Subject: Subscriptions: Add watched column in database for future feature

---
 youtube/subscriptions.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 93767b7..5f17ee6 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -51,7 +51,8 @@ def open_database():
                               duration text,
                               time_published integer NOT NULL,
                               is_time_published_exact integer DEFAULT 0,
-                              description text
+                              description text,
+                              watched integer default 0
                           )''')
         cursor.execute('''CREATE TABLE IF NOT EXISTS tag_associations (
                               id integer PRIMARY KEY,
-- 
cgit v1.2.3


From 0a590c3364612d8c981fe25aac14d809b65a2dc1 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Mon, 2 Sep 2019 19:10:38 -0700
Subject: Subscriptions: Order videos by the time they were added to db

---
 youtube/subscriptions.py | 106 ++++++++++++++++++++++++++---------------------
 1 file changed, 58 insertions(+), 48 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index 5f17ee6..be5ecbe 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -39,8 +39,8 @@ def open_database():
                               id integer PRIMARY KEY,
                               yt_channel_id text UNIQUE NOT NULL,
                               channel_name text NOT NULL,
-                              time_last_checked integer,
-                              next_check_time integer,
+                              time_last_checked integer DEFAULT 0,
+                              next_check_time integer DEFAULT 0,
                               muted integer DEFAULT 0
                           )''')
         cursor.execute('''CREATE TABLE IF NOT EXISTS videos (
@@ -51,6 +51,7 @@ def open_database():
                               duration text,
                               time_published integer NOT NULL,
                               is_time_published_exact integer DEFAULT 0,
+                              time_noticed integer NOT NULL,
                               description text,
                               watched integer default 0
                           )''')
@@ -96,11 +97,10 @@ def is_subscribed(channel_id):
 def _subscribe(cursor, channels):
     ''' channels is a list of (channel_id, channel_name) '''
 
-    # set time_last_checked to 0 on all channels being subscribed to
-    channels = ( (channel_id, channel_name, 0) for channel_id, channel_name in channels)
+    channels = ( (channel_id, channel_name, 0, 0) for channel_id, channel_name in channels)
 
-    cursor.executemany('''INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked)
-                          VALUES (?, ?, ?)''', channels)
+    cursor.executemany('''INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked, next_check_time)
+                          VALUES (?, ?, ?, ?)''', channels)
 
 
 def delete_thumbnails(to_delete):
@@ -146,14 +146,14 @@ def _get_videos(cursor, number_per_page, offset, tag = None):
                                       INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
                                       INNER JOIN tag_associations on videos.sql_channel_id = tag_associations.sql_channel_id
                                       WHERE tag = ? AND muted = 0
-                                      ORDER BY time_published DESC
+                                      ORDER BY time_noticed DESC, time_published DESC
                                       LIMIT ? OFFSET ?''', (tag, number_per_page*9, offset)).fetchall()
     else:
         db_videos = cursor.execute('''SELECT video_id, title, duration, time_published, is_time_published_exact, channel_name
                                       FROM videos
                                       INNER JOIN subscribed_channels on videos.sql_channel_id = subscribed_channels.id
                                       WHERE muted = 0
-                                      ORDER BY time_published DESC
+                                      ORDER BY time_noticed DESC, time_published DESC
                                       LIMIT ? OFFSET ?''', (number_per_page*9, offset)).fetchall()
 
     pseudo_number_of_videos = offset + len(db_videos)
@@ -328,15 +328,20 @@ if settings.autocheck_subscriptions:
     with open_database() as connection:
         with connection as cursor:
             now = time.time()
-            for row in cursor.execute('''SELECT yt_channel_id, channel_name, next_check_time FROM subscribed_channels WHERE next_check_time IS NOT NULL AND muted != 1''').fetchall():
+            for row in cursor.execute('''SELECT yt_channel_id, channel_name, next_check_time FROM subscribed_channels WHERE muted != 1''').fetchall():
 
-                # expired, check randomly within the 30 minutes
+                if row[2] is None:
+                    next_check_time = 0
+                else:
+                    next_check_time = row[2]
+
+                # expired, check randomly within the next hour
                 # note: even if it isn't scheduled in the past right now, it might end up being if it's due soon and we dont start dispatching by then, see below where time_until_earliest_job is negative
-                if row[2] < now:
+                if next_check_time < now:
                     next_check_time = now + 3600*secrets.randbelow(60)/60
                     row = (row[0], row[1], next_check_time)
                     _schedule_checking(cursor, row[0], next_check_time)
-                autocheck_jobs.append({'channel_id': row[0], 'channel_name': row[1], 'next_check_time': row[2]})
+                autocheck_jobs.append({'channel_id': row[0], 'channel_name': row[1], 'next_check_time': next_check_time})
 
 
@@ -400,8 +405,6 @@ def _get_upstream_videos(channel_id):
 
     print("Checking channel: " + channel_status_name)
 
-    videos = []
-
     tasks = (
         gevent.spawn(channel.get_channel_tab, channel_id, print_status=False), # channel page, need for video duration
         gevent.spawn(util.fetch_url, 'https://www.youtube.com/feeds/videos.xml?channel_id=' + channel_id) # atoma feed, need for exact published time
@@ -444,40 +447,47 @@ def _get_upstream_videos(channel_id):
         print('Failed to read atoma feed for ' + channel_status_name)
         traceback.print_exc()
 
-
-    channel_videos = channel.extract_info(json.loads(channel_tab), 'videos')['items']
-    for i, video_item in enumerate(channel_videos):
-        if 'description' not in video_item:
-            video_item['description'] = ''
-
-        if video_item['id'] in times_published:
-            video_item['time_published'] = times_published[video_item['id']]
-            video_item['is_time_published_exact'] = True
-        else:
-            video_item['is_time_published_exact'] = False
-            try:
-                video_item['time_published'] = youtube_timestamp_to_posix(video_item['published']) - i  # subtract a few seconds off the videos so they will be in the right order
-            except KeyError:
-                print(video_item)
-        videos.append((channel_id, video_item['id'], video_item['title'], video_item['duration'], video_item['time_published'], video_item['is_time_published_exact'], video_item['description']))
-
-
-    if len(videos) == 0:
-        average_upload_period = 4*7*24*3600 # assume 1 month for channel with no videos
-    elif len(videos) < 5:
-        average_upload_period = int((time.time() - videos[len(videos)-1][4])/len(videos))
-    else:
-        average_upload_period = int((time.time() - videos[4][4])/5) # equivalent to averaging the time between videos for the last 5 videos
-
-    # calculate when to check next for auto checking
-    # add some quantization and randomness to make pattern analysis by Youtube slightly harder
-    quantized_upload_period = average_upload_period - (average_upload_period % (4*3600)) + 4*3600   # round up to nearest 4 hours
-    randomized_upload_period = quantized_upload_period*(1 + secrets.randbelow(50)/50*0.5) # randomly between 1x and 1.5x
-    next_check_delay = randomized_upload_period/10    # check at 10x the channel posting rate. might want to fine tune this number
-    next_check_time = int(time.time() + next_check_delay)
-
     with open_database() as connection:
         with connection as cursor:
+            is_first_check = cursor.execute('''SELECT time_last_checked FROM subscribed_channels WHERE yt_channel_id=?''', [channel_id]).fetchone()[0] in (None, 0)
+            video_add_time = int(time.time())
+
+            videos = []
+            channel_videos = channel.extract_info(json.loads(channel_tab), 'videos')['items']
+            for i, video_item in enumerate(channel_videos):
+                if 'description' not in video_item:
+                    video_item['description'] = ''
+
+                if video_item['id'] in times_published:
+                    time_published = times_published[video_item['id']]
+                    is_time_published_exact = True
+                else:
+                    is_time_published_exact = False
+                    try:
+                        time_published = youtube_timestamp_to_posix(video_item['published']) - i  # subtract a few seconds off the videos so they will be in the right order
+                    except KeyError:
+                        print(video_item)
+                if is_first_check:
+                    time_noticed = time_published  # don't want a crazy ordering on first check, since we're ordering by time_noticed
+                else:
+                    time_noticed = video_add_time
+                videos.append((channel_id, video_item['id'], video_item['title'], video_item['duration'], time_published, is_time_published_exact, time_noticed, video_item['description']))
+
+
+            if len(videos) == 0:
+                average_upload_period = 4*7*24*3600 # assume 1 month for channel with no videos
+            elif len(videos) < 5:
+                average_upload_period = int((time.time() - videos[len(videos)-1][4])/len(videos))
+            else:
+                average_upload_period = int((time.time() - videos[4][4])/5) # equivalent to averaging the time between videos for the last 5 videos
+
+            # calculate when to check next for auto checking
+            # add some quantization and randomness to make pattern analysis by Youtube slightly harder
+            quantized_upload_period = average_upload_period - (average_upload_period % (4*3600)) + 4*3600   # round up to nearest 4 hours
+            randomized_upload_period = quantized_upload_period*(1 + secrets.randbelow(50)/50*0.5) # randomly between 1x and 1.5x
+            next_check_delay = randomized_upload_period/10    # check at 10x the channel posting rate. might want to fine tune this number
+            next_check_time = int(time.time() + next_check_delay)
+
             # calculate how many new videos there are
             row = cursor.execute('''SELECT video_id
                                     FROM videos
@@ -496,8 +506,8 @@ def _get_upstream_videos(channel_id):
                     index += 1
                 number_of_new_videos = index
 
-            cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, is_time_published_exact, description)
-                                  VALUES ((SELECT id FROM subscribed_channels WHERE yt_channel_id=?), ?, ?, ?, ?, ?, ?)''', videos)
+            cursor.executemany('''INSERT OR IGNORE INTO videos (sql_channel_id, video_id, title, duration, time_published, is_time_published_exact, time_noticed, description)
+                                  VALUES ((SELECT id FROM subscribed_channels WHERE yt_channel_id=?), ?, ?, ?, ?, ?, ?, ?)''', videos)
             cursor.execute('''UPDATE subscribed_channels
                               SET time_last_checked = ?, next_check_time = ?
                               WHERE yt_channel_id=?''', [int(time.time()), next_check_time, channel_id])
-- 
cgit v1.2.3


From c393031ac54af959561214c8b1d6b22647a81b89 Mon Sep 17 00:00:00 2001
From: James Taylor <user234683@users.noreply.github.com>
Date: Tue, 3 Sep 2019 17:47:23 -0700
Subject: Subscriptions: autocheck after subscribing to channel

---
 youtube/subscriptions.py | 42 +++++++++++++++++++++++++-----------------
 1 file changed, 25 insertions(+), 17 deletions(-)

(limited to 'youtube')

diff --git a/youtube/subscriptions.py b/youtube/subscriptions.py
index be5ecbe..2e821de 100644
--- a/youtube/subscriptions.py
+++ b/youtube/subscriptions.py
@@ -79,29 +79,37 @@ def with_open_db(function, *args, **kwargs):
         with connection as cursor:
             return function(cursor, *args, **kwargs)
 
+def _is_subscribed(cursor, channel_id):
+    result = cursor.execute('''SELECT EXISTS(
+                                   SELECT 1
+                                   FROM subscribed_channels
+                                   WHERE yt_channel_id=?
+                                   LIMIT 1
+                               )''', [channel_id]).fetchone()
+    return bool(result[0])
+
 def is_subscribed(channel_id):
     if not os.path.exists(database_path):
         return False
 
-    with open_database() as connection:
-        with connection as cursor:
-            result = cursor.execute('''SELECT EXISTS(
-                                           SELECT 1
-                                           FROM subscribed_channels
-                                           WHERE yt_channel_id=?
-                                           LIMIT 1
-                                       )''', [channel_id]).fetchone()
-            return bool(result[0])
-
+    return with_open_db(_is_subscribed, channel_id)
 
-def _subscribe(cursor, channels):
+def _subscribe(channels):
     ''' channels is a list of (channel_id, channel_name) '''
+    channels = list(channels)
+    with open_database() as connection:
+        with connection as cursor:
+            channel_ids_to_check = [channel[0] for channel in channels if not _is_subscribed(cursor, channel[0])]
 
-    channels = ( (channel_id, channel_name, 0, 0) for channel_id, channel_name in channels)
-
-    cursor.executemany('''INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked, next_check_time)
-                          VALUES (?, ?, ?, ?)''', channels)
+            rows = ( (channel_id, channel_name, 0, 0) for channel_id, channel_name in channels)
+            cursor.executemany('''INSERT OR IGNORE INTO subscribed_channels (yt_channel_id, channel_name, time_last_checked, next_check_time)
+                                  VALUES (?, ?, ?, ?)''', rows)
 
+    if settings.autocheck_subscriptions:
+        # important that this is after the changes have been committed to database
+        # otherwise the autochecker (other thread) tries checking the channel before it's in the database
+        channel_names.update(channels)
+        check_channels_if_necessary(channel_ids_to_check)
 
 def delete_thumbnails(to_delete):
     for thumbnail in to_delete:
@@ -611,7 +619,7 @@ def import_subscriptions():
     else:
             return '400 Bad Request: Unsupported file format: ' + mime_type + '. Only subscription.json files (from Google Takeouts) and XML OPML files exported from Youtube\'s subscription manager page are supported', 400
 
-    with_open_db(_subscribe, channels)
+    _subscribe(channels)
 
     return flask.redirect(util.URL_ORIGIN + '/subscription_manager', 303)
 
@@ -757,7 +765,7 @@ def post_subscriptions_page():
     if action == 'subscribe':
         if len(request.values.getlist('channel_id')) != len(request.values.getlist('channel_name')):
             return '400 Bad Request, length of channel_id != length of channel_name', 400
-        with_open_db(_subscribe, zip(request.values.getlist('channel_id'), request.values.getlist('channel_name')))
+        _subscribe(zip(request.values.getlist('channel_id'), request.values.getlist('channel_name')))
 
     elif action == 'unsubscribe':
         with_open_db(_unsubscribe, request.values.getlist('channel_id'))
-- 
cgit v1.2.3