#!/bin/sh # update feeds, merge with old feeds. # NOTE: assumes "sfeed_*" executables are in $PATH. # defaults sfeedpath="$HOME/.sfeed" sfeedfile="$sfeedpath/feeds" # temporary file for new feeds (for merging). sfeedfilenew="$sfeedfile.new" # load config (evaluate shellscript). # loadconfig(configfile) loadconfig() { # allow to specify config via argv[1]. if [ ! "$1" = "" ]; then # get absolute path of config file. config=$(readlink -f "$1") else # default config location. config="$HOME/.sfeed/sfeedrc" fi # load config: config is loaded here to be able to override above variables # (sfeedpath, sfeedfile, etc). if [ -r "$config" ]; then . "$config" else echo "Configuration file \"$config\" does not exist or is not readable." >&2 echo "See sfeedrc.example for an example." >&2 exit 1 fi } # merge raw files. # merge(oldfile, newfile) merge() { # unique sort by id, link, title. # order by feedname (asc), feedurl (asc) and timestamp (desc). (cat "$1" "$2" 2> /dev/null) | sort -t ' ' -u -k7,7 -k4,4 -k3,3 | sort -t ' ' -k10,10 -k11,11 -k1r,1 } # fetch a feed via HTTP/HTTPS etc. # fetchfeed(url, name, lastupdated) fetchfeed() { if curl -f -s -S -L --max-time 15 -z "$3" "$1"; then printf " OK %s %s\n" "`date +'%H:%M:%S'`" "$2" >&2 else printf "FAIL %s %s\n" "`date +'%H:%M:%S'`" "$2" >&2 fi } # convert encoding from one encoding to another. # convertencoding(from, to) convertencoding() { if [ ! "$1" = "" ] && [ ! "$2" = "" ] && [ ! "$1" = "$2" ]; then # from != to iconv -cs -f "$1" -t "$2" 2> /dev/null else cat # no convert, just output fi } # fetch and parse feed. # feed(name, feedurl, [basesiteurl], [encoding]) feed() { (tmpfeedfile=$(mktemp -p "$TMPDIR") tmpencfile="" encoding="$4" if [ ! "$encoding" = "" ]; then fetchfeed "$2" "$1" "$lastupdated" | convertencoding "$encoding" "utf-8" else # detect encoding. tmpencfile=$(mktemp -p "$TMPDIR") fetchfeed "$2" "$1" "$lastupdated" > "$tmpencfile" detectenc=$(sfeed_xmlenc < "$tmpencfile") convertencoding "$detectenc" "utf-8" < "$tmpencfile" rm -f "$tmpencfile" fi | sfeed "$1 $2 $3" > "$tmpfeedfile") & } terminated() { isrunning="0" } cleanup() { # remove temporary files rm -rf "$tmpfile" "$TMPDIR" } feeds() { echo "Configuration file \"$config\" is invalid or does not contain a \"feeds\" function." >&2 echo "See sfeedrc.example for an example." >&2 } # load config file. loadconfig "$1" # fetch feeds and store in temporary file. TMPDIR=$(mktemp -d "/tmp/sfeed_XXXXXX") # get date of last modified feedfile in format: # YYYYmmdd HH:MM:SS [+-][0-9]* lastupdated=$(stat -c "%y" "$sfeedfile" 2> /dev/null | cut -c 1-4,6-7,9-10,11-19,30-) # kill whole current process group on ^C. isrunning="1" # SIGTERM: signal to terminate parent. trap -- "terminated" "15" # SIGINT: kill all running childs >:D trap -- "kill -TERM -$$" "2" # fetch feeds specified in config file. feeds # make sure path exists. mkdir -p "$sfeedpath" # wait till all feeds are fetched (allows running in parallel). wait # if terminated cleanup. [ "$isrunning" = "0" ] && cleanup && exit 1 # concat all individual feed files to a single file. # NOTE: mktemp uses $TMPDIR for temporary directory. tmpfile=$(mktemp "sfeed_XXXXXX") find "$TMPDIR" -type f -exec cat {} \; > "$tmpfile" # get new data and merge with old. merge "$sfeedfile" "$tmpfile" > "$sfeedfilenew" # overwrite old file with updated file mv "$sfeedfilenew" "$sfeedfile" # cleanup temporary files etc. cleanup