nixos-config/modules/nixos/tasks/multimedia-archive/convert-newpipe-db-to-json

107 lines
3.4 KiB
Python
Executable File

#!/usr/bin/env nix-shell
#! nix-shell -i python3 -p python3
# This script is used for generating a JSON object from a Newpipe database to
# be used for multimedia archive task (i.e.,
# `config.tasks.multimedia-archive`).
import argparse
import sys
import sqlite3
import json
import re
import os
import shutil
import tempfile
import fileinput
from pathlib import Path
def kebab_case(string):
string = string.lower()
string = re.sub("\s+", "-", string)
string = re.sub("[^a-zA-Z0-9-]", "", string)
string = re.sub("-+", "-", string)
string = re.sub("^-|-$", "", string)
return string
def extract_categories_from_db(db_file, categories):
with sqlite3.connect(db_file) as db:
db.row_factory = sqlite3.Row
query = '''
SELECT subscriptions.name AS name, subscriptions.url AS url, feed_group.name AS tag
FROM subscriptions
INNER JOIN feed_group_subscription_join AS subs_join
INNER JOIN feed_group
ON subs_join.subscription_id = subscriptions.uid AND feed_group.uid = subs_join.group_id
ORDER BY name COLLATE NOCASE;
'''
data = { kebab_case(category) : [] for category in categories }
for row in db.execute(query):
tag = row["tag"]
if tag in categories:
data[kebab_case(tag)].append({ "url": row["url"], "name": row["name"] })
return data
def list_categories(db_file):
with sqlite3.connect(db_file) as db:
query = '''
SELECT name FROM feed_group ORDER BY name;
'''
data = []
for row in db.execute(query):
data.append(row[0])
return data
def extract_db(newpipe_archive):
tmpdir = tempfile.mkdtemp(suffix="convert-newpipe-db")
shutil.unpack_archive(newpipe_archive, tmpdir)
return Path(tmpdir)
if __name__ == "__main__":
parser = argparse.ArgumentParser()
parser.add_argument("newpipe_db", metavar="NEWPIPE_DB", help="Newpipe database file (as a zip file) exported straight from the app.")
parser.add_argument("categories", metavar="CATEGORIES", nargs="*", help="A list of categories to be extracted. If absent, it will extract with all categories.")
parser.add_argument("--list-categories", "-l", action="store_true", help="List all categories from the database.")
parser.add_argument("--output", "-o", action="store", metavar="FILE", help="If present, store the output in the given file")
args = parser.parse_args()
newpipe_archive = args.newpipe_db
tmpdir = extract_db(newpipe_archive)
db_file = tmpdir / "newpipe.db"
if args.list_categories:
for category in list_categories(db_file):
print(category)
else:
categories = []
if not sys.stdin.isatty():
for line in sys.stdin:
categories.append(line.strip())
if len(args.categories) > 0:
categories = args.categories
elif len(categories) == 0:
categories = list_categories(db_file)
data = extract_categories_from_db(db_file, categories)
output_file = args.output
if output_file:
with open(output_file, mode="w", encoding="UTF-8") as file:
json.dump(data, file, sort_keys=True, indent=2, ensure_ascii=False)
else:
print(json.dumps(data, sort_keys=True, indent=2, ensure_ascii=False))
shutil.rmtree(tmpdir)
# vi:ft=python:ts=4