#!/usr/bin/env nix-shell
#! nix-shell -i oil -p oil coreutils sqlite unzip ripgrep file dasel curl
# Convert a Newpipe database (assuming it was exported within the app) into OPML v2.
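# A hypothetical usage example (both the script name and the export filename are placeholders):
#   ./export-newpipe-subscriptions.oil NewPipeData.zip > subscriptions.opml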
# Dependencies:
# * oil (Oil shell) v0.8.12
# * sqlite3 v3.34.0
# * unzip
# * ripgrep v12.1.1
# * dasel
# * curl
# * file

# Enable all of Oil's strict options to catch common shell errors early.
shopt -s strict:all
var FILENAME = $1
# Testing if the given file is a zip file.
file --mime $FILENAME | rg "application/zip" --quiet || exit 1
var channel_id_eggex = / 'https://www.youtube.com/channel/' (word) /
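# As a rough, hypothetical example: for 'https://www.youtube.com/channel/UC1234', the eggex
# above captures 'UC1234'; when interpolated into the sed expression later on, it is converted
# into an ERE that `sed --regexp-extended` understands.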
var NEWPIPE_DB = "newpipe.db"
var TEMP_FOLDER_NAME = "newpipe"
# The SQL query to get the required metadata.
var NEWPIPE_DB_QUERY = "
SELECT name, url, service_id, group_concat(tag, ',') AS tags FROM (
SELECT subscriptions.name, subscriptions.url, subscriptions.service_id, '/' || feed_group.name AS tag
FROM subscriptions
LEFT JOIN feed_group_subscription_join AS subs_join
ON subs_join.subscription_id = subscriptions.uid
LEFT JOIN feed_group
ON feed_group.uid = subs_join.group_id
) GROUP BY name ORDER BY name COLLATE NOCASE;"
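# The query should yield one row per subscription, with its feed group names joined into a
# comma-separated tags column; a hypothetical example row (in CSV):
#   Example Channel,https://www.youtube.com/channel/UC1234,0,"/Music,/Tech"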
# Print the beginning of the template.
cat <<OPML
<opml version="2.0">
<head>
<title>Newpipe subscriptions</title>
<dateCreated>$(date "+%F %T %z")</dateCreated>
<ownerName>$(whoami)</ownerName>
<docs>http://dev.opml.org/spec2.html</docs>
</head>
<body>
OPML
# Simply prints an `<outline>` element formatted appropriately for the resulting output.
# Don't mind how it is printed right now. :)
proc print-outline(title, xml_url, html_url, tags = "") {
printf ' <outline type="rss" xmlUrl="%s" htmlUrl="%s" title="%s" text="%s"' $xml_url $html_url $title $title
if test -n $tags {
printf ' category="%s"' $tags
}
printf '/>\n'
}
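# A hypothetical usage example:
#   print-outline 'Example Channel' 'https://example.tld/feeds/videos.atom' 'https://example.tld/c/example' '/Music'
# which should print a single self-closing <outline> element carrying those values.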
# Print the channels in the OPML body.
# This only occurs if the given file does contain a Newpipe database.
if unzip -l $FILENAME | rg --quiet $NEWPIPE_DB {
# Make the temporary directory (preferably in the current directory to make cleanup easier).
mkdir $TEMP_FOLDER_NAME && unzip -q -u $FILENAME -d $TEMP_FOLDER_NAME
# Setting up some automatic cleanup upon exit.
trap "rm --recursive $TEMP_FOLDER_NAME" EXIT
# Quickly check if a SQLite database is in the Newpipe database folder.
file --mime "${TEMP_FOLDER_NAME}/${NEWPIPE_DB}" | rg --quiet "application/x-sqlite3" || exit 1
# Extract the data from the database and process each row individually.
# Note that we format the data as CSV with one object per line since, as of Oil v0.8.11, Oil seems to have problems taking fully nested data from external commands (not yet completely verified).
# We'll have to rewrite this part once Oil fixes the issue with nested objects.
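# After the dasel conversion below, each line fed into the loop should be a flat JSON object,
# e.g. (hypothetical): {"name":"Example Channel","url":"https://www.youtube.com/channel/UC1234","service_id":"0","tags":"/Music"}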
sqlite3 "${TEMP_FOLDER_NAME}/${NEWPIPE_DB}" "${NEWPIPE_DB_QUERY}" --csv --header \
| dasel select --parser csv --multiple --selector '.[*]' --compact --write json \
| while read channel {
# We have each channel as a separate JSON object per line.
echo $channel | json read :channel
setvar name = channel['name']
setvar url = channel['url']
setvar service_id = channel['service_id']
setvar tags = channel['tags']
# The `service_id` column indicates which of Newpipe's supported platforms the channel came from.
# Since the way to get the required data differs per platform, we handle each one in a case statement.
case $service_id {
# YouTube
'0') {
setvar channel_id = $(echo $url | sed --quiet --regexp-extended "s|$channel_id_eggex|\\1|p")
setvar xml_url = "https://www.youtube.com/feeds/videos.xml?channel_id=${channel_id}"
}
;;
# Peertube instances
'3') {
# This naive solution walks through the URL parts to find the instance domain, assuming the database was exported properly from the app and not tampered with.
# It can go into an infinite loop, so take caution for now.
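# As a hypothetical example, for a subscription URL like 'https://peertube.example/video-channels/example_channel',
# fields '-3' yield 'https://peertube.example' (the instance domain) and fields '4-' yield
# 'video-channels/example_channel'; the loop below extends the field range for instances served under a subpath.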
setvar domain = $(echo $url | cut --delimiter='/' --fields='-3')
setvar _domain_part_index = 4
until (Bool($(curl --silent "$domain/api/v1/config/about" | dasel --parser json --selector ".instance.name"))) {
setvar domain = $(echo $url | cut --delimiter='/' --fields="-$_domain_part_index")
setvar _domain_part_index = Int($_domain_part_index) + 1
}
setvar channel_url = $(echo $url | cut --delimiter='/' --fields='4-')
setvar feed_type = $(echo $channel_url | rg "video-channels" --quiet && echo "videoChannelId" || echo "accountId")
setvar channel_id = $(curl "${domain}/api/v1/${channel_url}" --silent | dasel --parser json --selector '.id')
setvar xml_url = "$domain/feeds/videos.atom?$feed_type=$channel_id"
}
;;
}
print-outline $name $xml_url $url $tags
}
}
# Print the remaining parts of the document.
cat <<OPML
</body>
</opml>
OPML