summary | refs | log | tree | commit | diff
path: root/README
diff options
context:
space:
mode:
author: Hiltjo Posthuma <hiltjo@codemadness.org> 2021-04-22 20:22:27 +0200
committer: Hiltjo Posthuma <hiltjo@codemadness.org> 2021-04-28 18:26:57 +0200
commit: 675cfe6a73b369d1eb7adefa6e59dc37259a513d (patch)
tree: 02950925e1c0437f8928289423a7ad3eae506854 /README
parent: 8ad3f119b2a41cda023a61bcb75aa96144d25e86 (diff)
README: update newsboat export script
Since version 2.22 (2020-12-21), newsboat stores the MIME type of an item's content, so export it as well. For older entries the MIME type is empty; these are exported as "html" (even though they might have been plain text). Also add the (empty) category field.
Diffstat (limited to 'README')
-rw-r--r-- README 26
1 files changed, 16 insertions, 10 deletions
diff --git a/README b/README
index e903f32..2fef8b2 100644
--- a/README
+++ b/README
@@ -683,7 +683,6 @@ TSV format.
#
# Usage: create some directory to store the feeds, run this script.
#
- # Assumes "html" for content-type (Newsboat only handles HTML content).
# Assumes feednames are unique and a feed title is set.
# newsboat cache.db file.
@@ -698,11 +697,10 @@ TSV format.
.mode ascii
.output
SELECT
- i.pubDate, i.title, i.url, i.content, i.guid, i.author,
- i.enclosure_url,
- f.rssurl AS rssurl, f.title AS feedtitle, i.unread --,
- -- i.id, i.enclosure_type, i.enqueued, i.flags, i.deleted,
- -- i.base
+ i.pubDate, i.title, i.url, i.content, i.content_mime_type,
+ i.guid, i.author, i.enclosure_url,
+ f.rssurl AS rssurl, f.title AS feedtitle, i.unread
+ -- i.id, i.enclosure_type, i.enqueued, i.flags, i.deleted, i.base
FROM rss_feed f
INNER JOIN rss_item i ON i.feedurl = f.rssurl
ORDER BY
@@ -738,17 +736,25 @@ TSV format.
return title;
}
{
- fname = feedname($8, $9);
+ fname = feedname($9, $10);
if (!feed[fname]++) {
- print "Writing file: \"" fname "\" (title: " $9 ", url: " $8 ")" > "/dev/stderr";
+ print "Writing file: \"" fname "\" (title: " $10 ", url: " $9 ")" > "/dev/stderr";
}
+ contenttype = field($5);
+ if (contenttype == "")
+ contenttype = "html";
+ else if (index(contenttype, "/html") || index(contenttype, "/xhtml"))
+ contenttype = "html";
+ else
+ contenttype = "plain";
+
print $1 "\t" field($2) "\t" field($3) "\t" content($4) "\t" \
- "html" "\t" field($5) "\t" field($6) "\t" field($7) \
+ contenttype "\t" field($6) "\t" field($7) "\t" field($8) "\t" \
> fname;
# write URLs of the read items to a file line by line.
- if ($10 == "0") {
+ if ($11 == "0") {
print $3 > "urls";
}
}'