rtrckr

yekm · Feb 13, 2025 · 87bcc67 · 87bcc67
1 parent eb97878
commit 87bcc67
Show file tree

Hide file tree

Showing 2 changed files with 182 additions and 0 deletions.
diff --git a/README.md b/README.md
@@ -104,6 +104,46 @@ delete torrents with their files
 
 qbt docs: https://github.com/qbittorrent/qBittorrent/wiki/WebUI-API-(qBittorrent-4.1)#torrent-management
 
+# rtrckr.sh
+
+Tool for interfacing with rutracker.org. Requires `rtrkr_curl.sh` to be available
+in PATH. `rtrkr_curl.sh` can be obtained in DevTools network window by seleceting
+`Copy as CURL` in the relevant menu item. After creating it must be edited to
+accept url as first parameter (also you can specify a `--proxy` parameter there).
+See a bottom of `rtrckr.sh` for an example.
+
+Search function relies on plain text database in TSV format. This database can be
+obtained by converting xml dump of all torrents (5591249 topic id) by running
+`rtrckr.sh xml2tsv`
+
+`rtrckr.sh grep` is the main command which finds words in tsv file. Equivalent to
+`cat $tsv | grep arg1 | grep arg2 | grep arg3 ...` (args is actually in reverse
+order but whatever)
+
+`rtrckr.sh find` same as grep but output is somewhat filtered. Sorted by size,
+outputs only certain columns (kinda unstable, but id should always be the first column)
+
+`rtrckr.sh download` download torrent file into /tmp and add it to a qbt via
+`qbtlib.sh add`
+
+`rtrckr.sh frompage` lists all torrent ids from a certain webpage. Useful to
+download a list of torrents from some forum topic.
+
+`rtrckr.sh xml2tsv` converts xml dump to a tsv database
+
+`rtrckr.sh curl` invokes rtrkr_curl.sh
+
+## usage
+
+find all torrents with `ubuntu` in title or forum name  
+`rtrckr.sh find ubuntu`
+
+download all relevant torrents to a certain directory  
+`rtrckr.sh find ubuntu bdremux | cut -f1 | parallel -j4 'rtrckr.sh download {} -F savepath=/mnt/all/film -F category=film -F tags=rtrckr -F paused=false'`
+
+download all torrents mentioned on certain page  
+`rtrckr.sh frompage https://rutracker.org/forum/viewtopic.php?t=6012098 | parallel -j4 'rtrckr.sh download {} -F savepath=/mnt/all/mult/FilmScan -F category=mult/fscan -F paused=false'`
+
 ## fun
 
 Total created processes:

diff --git a/rtrckr.sh b/rtrckr.sh
@@ -0,0 +1,142 @@
+#!/bin/bash
+
+#set -u
+
+export PATH=$BASH_SOURCE:$PATH
+
+die() {
+	echo $@
+	exit 1
+}
+
+helpall() {
+	argn=$(grep -P '^[\w\.]+\)' ${BASH_SOURCE[0]} | wc -l)
+	helpn=$(grep -w ' -n "$help" ] && die ' ${BASH_SOURCE[0]} | grep -v helpn | wc -l)
+	[ $argn -ne $helpn ] && echo incomplete help $helpn of $argn args && exit -1
+
+	cat ${BASH_SOURCE[0]} | grep -P '^[\w\.]+\)' | tr -d ')' | \
+		parallel --tag -k rtrckr.sh help | qbtlib.sh table
+
+	cat << EOF
+
+examples:
+
+rtrckr.sh find ubuntu bdremux
+rtrckr.sh ifind ubuntu bdremux | parallel --tag -j4 'rtrckr.sh download {} -F savepath=/mnt/all/film -F category= -F tags=rtrckr -F paused=false'
+rtrckr.sh frompage https://rutracker.org/forum/viewtopic.php?t=6012098 | parallel -j4 'rtrckr.sh download {} -F savepath=/mnt/all/mult/FilmScan -F category=mult/fscan -F paused=false'
+EOF
+
+	head -n1 $tsv
+	echo 'id time size title hash fid forum'
+	echo '1  2    3    4     5    6   7    '
+}
+
+tsv=$(dirname $(readlink "${BASH_SOURCE[0]}"))/rtrckr/rtrckr.tsv
+
+cmd=$1
+shift
+if [ "$cmd" = "help" ]; then
+	help=1
+	cmd=$1
+	shift
+fi
+
+[ -z "$cmd" ] && helpall && die
+
+case $cmd in
+grep)
+	[ -n "$help" ] && die 'find patterns in tsv file'
+	[ -s $tsv ] || die "error: no tsv file ($tsv), see xml2tsv.sh"
+	if [ -z "$1" ]; then
+		cat $tsv
+	else
+		rtrckr.sh grep ${@:2} | grep -i "$1"
+	fi
+	;;
+
+find)
+	[ -n "$help" ] && die 'find torrents, columns: size in GiB, name, forum'
+	#cat $tsv | grep $@ \
+	rtrckr.sh grep $@ \
+		| cut -f1,3,4,6,7 \
+		| sort -k2 -n \
+		| awk -F $'\t' ' BEGIN {OFS = FS} {$2 = $2/1024/1024/1024; print}' # \
+		#| qbtlib.sh table #-T3
+
+	;;
+ifind)
+	[ -n "$help" ] && die 'like find but output is only id, useful for `rtrckr.sh download`'
+	rtrckr.sh grep $@ \
+		| cut -f1
+	;;
+
+download)
+	[ -n "$help" ] && die 'download torrent with id `arg1` and add it to qbt. optional args -F savepath= -F category= -F tags= -F paused=true'
+	id=$1
+	# TODO: use permanent ~/.cache and warn on very old files?
+	tcache=/tmp/qbtlib.cache.$id.torrent
+	[ -s $tcache ] || rtrckr.sh curl https://rutracker.org/forum/dl.php?t=$id >$tcache
+	qbtlib.sh add $tcache ${@:2}
+	;;
+
+frompage)
+	[ -n "$help" ] && die 'extract torrent ids from links from page `arg1`'
+	rtrckr.sh curl $1 | \
+	iconv -f cp1251 | \
+	fq -d html -o array=true -r '.. | select(.[0] == "a" and (.[1].href|test("viewtopic.php.t=[0-9]+$")))? .[1].href' |
+	sed 's/.*t=\([0-9]\+\).*/\1/'
+	;;
+
+xml2tsv)
+	[ -n "$help" ] && die 'update tsv database from xml file `arg1`'
+	#last file from personal location if no argument
+	xml=${1:-$(ls -t /mnt/hall/rtrkr/rutracker-*.xml.xz | tail -n1)}
+
+	cat $xml \
+		| xz -d \
+		| pv -N xml -crabt \
+		| grep -e '<title>' -e '<torrent ' -e '<forum ' \
+		| tr '\n' '\r' \
+		| sed 's/\r </ </g' \
+		| tr '\r' '\n' \
+		| pv -N filtered -crabt \
+		| perl -pe 's/.*torrent id="(\d+)" registred_at="(.+)" size="(\d+)".*<title>(.*)<\/title>.*hash="(\w+)".*forum id="(\d+)">(.*)<\/forum>.*/$1\t$2\t$3\t$4\t$5\tfid:$6\t$7/' \
+		| pv -N tsv -crabt \
+		>$tsv
+	;;
+
+curl)
+	[ -n "$help" ] && die 'invoke rtrkr_curl.sh'
+	which rtrkr_curl.sh >/dev/null || die 'rtrkr_curl.sh not fount, see README.md'
+	rtrkr_curl.sh $@
+	;;
+
+*)
+	die no such command
+	;;
+
+esac
+
+set +vx
+
+
+#curl \
+#    $@ \
+#    -s -S -L -4 \
+#  -x socks5://127.0.0.1:5055 \
+#  -H 'accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7' \
+#  -H 'accept-language: en-US,en;q=0.9' \
+#  -H 'cache-control: max-age=0' \
+#  -H 'content-type: application/x-www-form-urlencoded' \
+#  -H 'cookie: bb_guid=...' \
+#  -H 'origin: https://rutracker.org' \
+#  -H 'priority: u=0, i' \
+#  -H 'sec-ch-ua: "Not/A)Brand";v="8", "Chromium";v="126", "Google Chrome";v="126"' \
+#  -H 'sec-ch-ua-mobile: ?0' \
+#  -H 'sec-ch-ua-platform: "Linux"' \
+#  -H 'sec-fetch-dest: document' \
+#  -H 'sec-fetch-mode: navigate' \
+#  -H 'sec-fetch-site: same-origin' \
+#  -H 'sec-fetch-user: ?1' \
+#  -H 'upgrade-insecure-requests: 1' \
+#  -H 'user-agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/126.0.0.0 Safari/537.36'