#!/usr/bin/env nix-shell #! nix-shell -i python3 -p python3 # This script is used for generating a JSON object from a Newpipe database to # be used for multimedia archive task (i.e., # `config.tasks.multimedia-archive`). import argparse import sys import sqlite3 import json import re import os import shutil import tempfile import fileinput from pathlib import Path def kebab_case(string): string = string.lower() string = re.sub("\s+", "-", string) string = re.sub("[^a-zA-Z0-9-]", "", string) string = re.sub("-+", "-", string) string = re.sub("^-|-$", "", string) return string def extract_categories_from_db(db_file, categories): with sqlite3.connect(db_file) as db: db.row_factory = sqlite3.Row query = ''' SELECT subscriptions.name AS name, subscriptions.url AS url, feed_group.name AS tag FROM subscriptions INNER JOIN feed_group_subscription_join AS subs_join INNER JOIN feed_group ON subs_join.subscription_id = subscriptions.uid AND feed_group.uid = subs_join.group_id ORDER BY name COLLATE NOCASE; ''' data = { kebab_case(category) : [] for category in categories } for row in db.execute(query): tag = row["tag"] if tag in categories: data[kebab_case(tag)].append({ "url": row["url"], "name": row["name"] }) return data def list_categories(db_file): with sqlite3.connect(db_file) as db: query = ''' SELECT name FROM feed_group ORDER BY name; ''' data = [] for row in db.execute(query): data.append(row[0]) return data def extract_db(newpipe_archive): tmpdir = tempfile.mkdtemp(suffix="convert-newpipe-db") shutil.unpack_archive(newpipe_archive, tmpdir) return Path(tmpdir) if __name__ == "__main__": parser = argparse.ArgumentParser() parser.add_argument("newpipe_db", metavar="NEWPIPE_DB", help="Newpipe database file (as a zip file) exported straight from the app.") parser.add_argument("categories", metavar="CATEGORIES", nargs="*", help="A list of categories to be extracted. If absent, it will extract with all categories.") parser.add_argument("--list-categories", "-l", action="store_true", help="List all categories from the database.") parser.add_argument("--output", "-o", action="store", metavar="FILE", help="If present, store the output in the given file") args = parser.parse_args() newpipe_archive = args.newpipe_db tmpdir = extract_db(newpipe_archive) db_file = tmpdir / "newpipe.db" if args.list_categories: for category in list_categories(db_file): print(category) else: categories = [] if not sys.stdin.isatty(): for line in sys.stdin: categories.append(line.strip()) if len(args.categories) > 0: categories = args.categories elif len(categories) == 0: categories = list_categories(db_file) data = extract_categories_from_db(db_file, categories) output_file = args.output if output_file: with open(output_file, mode="w", encoding="UTF-8") as file: json.dump(data, file, sort_keys=True, indent=2) else: print(json.dumps(data, sort_keys=True, indent=2)) shutil.rmtree(tmpdir) # vi:ft=python:ts=4