Compare commits

...

4 Commits

Author SHA1 Message Date
Geoffrey Frogeye 8ae5c00f53 rssVideos: Replace guid by date and id 2021-12-29 14:43:13 +01:00
Geoffrey Frogeye c36534f696 rssVideos: Sync read state
Deleted but previously downloaded = read
2021-12-29 12:56:07 +01:00
Geoffrey Frogeye b0f14812d5 rssVideos: config
Moved to gdotfiles
2021-12-28 21:39:27 +01:00
Geoffrey Frogeye 21fd49f096 rssVideos: Clean up 2021-12-28 21:39:10 +01:00
4 changed files with 92 additions and 57 deletions

View File

@ -17,3 +17,4 @@ extensions:
x11_screens:
- HDMI-0
- eDP-1-1
max_video_height: 1440

View File

@ -13,3 +13,4 @@ extensions:
x11_screens:
- DP-1
- eDP-1
max_video_height: 720

View File

@ -1,7 +0,0 @@
{% set hostname = 'rss.frogeye.fr' %}
{% set user = 'geoffrey' %}
feed=https://{{ hostname }}/i/?a=rss&user={{ user }}&token={{ query('community.general.passwordstore', 'http/' + hostname + '/' + user + 'subkey=token' ) }}&hours=17520
videos=~/Téléchargements/RSS
subtitles=true
max-duration=7200
format=bestvideo[height<=1440]+bestaudio/best

View File

@ -8,7 +8,7 @@ The common use case would be a feed from an RSS aggregator
with the unread items (non-video links are ignored).
"""
import enum
import datetime
import functools
import logging
import os
@ -17,12 +17,8 @@ import random
import requests
import re
import subprocess
import sys
import time
import typing
import urllib.parse
import urllib.request
import urllib.error
import coloredlogs
import configargparse
@ -31,7 +27,6 @@ import yt_dlp
log = logging.getLogger(__name__)
# TODO Lockfile, or a way to parallel watch and download
# TODO Save ytdl infos and view info separately
def configure_logging(args: configargparse.Namespace) -> None:
@ -113,13 +108,15 @@ class RVElement:
parent: "RVDatabase"
item: dict
downloaded_filepath: typing.Optional[str]
watched: bool
def __init__(self, parent: "RVDatabase", item: dict) -> None:
    """Wrap a raw feed item dict, keeping a backlink to its database."""
    self.parent = parent
    self.item = item
    # Path of the downloaded media file; None until set (e.g. from cache).
    self.downloaded_filepath = None
    # Local view state; flipped to True after the element is watched.
    self.watched = False
@property
def id(self) -> str:
    # Stable identifier assigned by the feed reader API; used as the
    # cache-matching key and for the edit-tag (mark read) endpoint.
    return self.item["id"]
@property
def title(self) -> str:
@ -134,8 +131,8 @@ class RVElement:
return self.item["origin"]["title"]
@property
def guid(self) -> int:
return int(self.item["timestampUsec"])
def date(self) -> datetime.datetime:
return datetime.datetime.fromtimestamp(self.item["published"])
@property
def is_researched(self) -> bool:
@ -147,19 +144,21 @@ class RVElement:
log.debug(f"From cache: {self}")
if cache.downloaded_filepath:
self.downloaded_filepath = cache.downloaded_filepath
if cache.watched:
self.watched = True
def __str__(self) -> str:
str = f"{self.guid}: {self.creator if self.creator else '?'} {self.title}"
str = f"{self.date.strftime('%y-%m-%d %H:%M')} ("
if self.is_researched:
if self.is_video:
str += f" ({format_duration(self.duration)})"
str += format_duration(self.duration)
else:
str += " (N/A)"
str += "--:--:--"
else:
str += " (?)"
str += f" {self.link}"
str += "??:??:??"
str += (
f") {self.creator if self.creator else '?'} "
f" {self.title} "
f" {self.link}"
)
return str
@property
@ -237,6 +236,12 @@ class RVElement:
return
self.download()
@property
def watched(self) -> bool:
    """Infer view state: downloaded at some point but the file is now gone."""
    if self.is_researched:
        # Deleted after having been downloaded ⇒ the user went through it.
        return self.was_downloaded and not self.downloaded
    # Without research data there is nothing to base the inference on.
    return False
def matches_filter(self, args: configargparse.Namespace) -> bool:
# Inexpensive filters
if args.seen != "any" and (args.seen == "seen") != self.watched:
@ -245,9 +250,6 @@ class RVElement:
if args.title and not re.search(args.title, self.title):
log.debug(f"Title not matching {args.title}: {self}")
return False
if args.guid and not re.search(args.guid, str(self.guid)):
log.debug(f"Guid not matching {args.guid}: {self}")
return False
if args.link and not re.search(args.link, self.link):
log.debug(f"Link not matching {args.link}: {self}")
return False
@ -277,8 +279,8 @@ class RVElement:
proc = subprocess.run(cmd)
proc.check_returncode()
self.watched = True
self.parent.save()
self.clean()
self.try_mark_read()
def clean(self) -> None:
assert self.is_video
@ -289,6 +291,32 @@ class RVElement:
if not self.parent.args.dryrun:
os.unlink(file)
def mark_read(self) -> None:
    """Mark this element read on the upstream reader, then drop it locally.

    Honors --dryrun (no request sent). Raises on HTTP errors or when the
    API does not answer "OK".
    """
    log.debug(f"Marking {self} read")
    if self.parent.args.dryrun:
        return
    endpoint = f"{self.parent.args.url}/reader/api/0/edit-tag"
    payload = {
        "i": self.id,
        "a": "user/-/state/com.google/read",
        "ac": "edit",
        "token": self.parent.feed_token,
    }
    response = requests.post(
        endpoint,
        data=payload,
        headers=self.parent.auth_headers,
    )
    response.raise_for_status()
    # The Google-Reader-compatible API answers a bare "OK" body on success.
    if response.text.strip() != "OK":
        raise RuntimeError(f"Couldn't mark {self} as read: {response.text}")
    log.info(f"Marked {self} as read")
    self.parent.elements.remove(self)
def try_mark_read(self) -> None:
    """Best-effort mark_read(): a network failure is logged, not raised."""
    try:
        self.mark_read()
    except requests.ConnectionError:
        # Offline is expected (e.g. watching cached videos); retry next run.
        log.warning(f"Couldn't mark {self} as read")
class RVDatabase:
SAVE_FILE = ".cache.p"
@ -322,26 +350,26 @@ class RVDatabase:
self.auth_headers = cache.auth_headers
def salvage_cache(self, cache: "RVDatabase") -> None:
log.debug(f"Salvaging cache")
log.debug("Salvaging cache")
cache_els = dict()
for cache_el in cache.elements:
cache_els[cache_el.guid] = cache_el
cache_els[cache_el.id] = cache_el
for el in self.elements:
if el.guid in cache_els:
el.salvage_cache(cache_els[el.guid])
if el.id in cache_els:
el.salvage_cache(cache_els[el.id])
def clean_cache(self, cache: "RVDatabase") -> None:
log.debug(f"Cleaning cache")
log.debug("Cleaning cache")
self_els = dict()
for self_el in self.elements:
self_els[self_el.guid] = self_el
self_els[self_el.id] = self_el
for el in cache.elements:
if el.guid not in self_els:
if el.id not in self_els:
if el.is_researched and el.is_video:
el.clean()
def import_cache(self, cache: "RVDatabase") -> None:
log.debug(f"Importing cache")
log.debug("Importing cache")
self.build_list([element.item for element in cache.elements])
@functools.cached_property
@ -483,6 +511,20 @@ class RVDatabase:
return elements
@functools.cached_property
def feed_token(self) -> str:
    """Write-access token fetched from the reader API, cached for the run."""
    r = requests.get(
        f"{self.args.url}/reader/api/0/token",
        headers=self.auth_headers,
    )
    r.raise_for_status()
    # Token is returned as the plain response body.
    return r.text.strip()
def try_mark_watched_read(self) -> None:
    """Sync read state upstream for every watched element.

    Iterates over a snapshot of self.elements: try_mark_read() can end up
    in mark_read(), which removes the element from self.elements, and
    removing from the list while iterating it would silently skip the
    element that follows each removal.
    """
    for element in list(self.elements):
        if element.watched:
            element.try_mark_read()
def get_args() -> configargparse.Namespace:
defaultConfigPath = os.path.join(
@ -558,11 +600,11 @@ def get_args() -> configargparse.Namespace:
default="old",
help="Sorting mechanism",
)
parser.add("--guid", help="Regex to filter guid")
parser.add("--creator", help="Regex to filter by creator")
parser.add("--title", help="Regex to filter by title")
parser.add("--link", help="Regex to filter by link")
parser.add("--duration", help="Comparative to filter by duration")
# TODO Date selector
parser.add(
"--seen",
choices=("seen", "unseen", "any"),
@ -600,8 +642,6 @@ def get_args() -> configargparse.Namespace:
"watch",
"binge",
"clean",
"seen",
"unseen",
),
default="download",
)
@ -614,13 +654,7 @@ def get_args() -> configargparse.Namespace:
return args
def main() -> None:
args = get_args()
configure_logging(args)
os.makedirs(args.videos, exist_ok=True)
os.chdir(args.videos)
def get_database(args: configargparse.Namespace) -> RVDatabase:
database = RVDatabase(args)
cache = RVDatabase.load()
feed_fetched = False
@ -635,6 +669,7 @@ def main() -> None:
raise RuntimeError("Couldn't fetch feed, refusing to download")
# This is a quirky failsafe in case of no internet connection,
# so the script doesn't go noting that no element is a video.
log.warning(f"Couldn't fetch feed: {err}")
if not feed_fetched:
if cache:
log.warning("Using cached feed.")
@ -646,12 +681,25 @@ def main() -> None:
database.clean_cache(cache)
database.save()
log.debug(f"Running action")
return database
def main() -> None:
args = get_args()
configure_logging(args)
os.makedirs(args.videos, exist_ok=True)
os.chdir(args.videos)
database = get_database(args)
log.debug("Running action")
if args.action == "clean":
database.clean()
else:
duration = 0
for element in database.filter(args):
duration += element.duration if element.is_video else 0
if args.action == "download":
element.preload()
elif args.action == "list":
@ -660,19 +708,11 @@ def main() -> None:
element.watch()
if args.action == "watch":
break
elif args.action == "seen":
if not element.watched:
log.info(f"Maked as seen: {element}")
element.watched = True
elif args.action == "unseen":
if element.watched:
log.info(f"Maked as unseen: {element}")
element.watched = False
else:
raise NotImplementedError(f"Unimplemented action: {args.action}")
duration += element.duration if element.is_video else 0
log.info(f"Total duration: {format_duration(duration)}")
database.attempt_clean()
database.try_mark_watched_read()
database.save()