shithub: rrss

--- /dev/null

+++ b/README

@@ -1,0 +1,6 @@

+This is a fork of rrss (http://code.9front.org/hg/rrss) by Stanley Lieber.

+This version is modified to handle multiple feeds at once.

+When run, the program expects a text file in which each line has the following format:

+<feed url> [tag1 [tag2 ... [tagN]]]

+For documentation, refer to rrss.txt, which is the original README of the program (the -t and -u options described there are replaced in this fork by the feed file).

--- /dev/null

+++ b/main.go

@@ -1,0 +1,223 @@

+// RSS feed reader that outputs plain text, werc/apps/barf, or werc/apps/blagh format.

+package main

+import (

+	"bufio"

+	"flag"

+	"fmt"

+	"io/ioutil"

+	"log"

+	"os"

+	"path"

+	"sort"

+	"strconv"

+	"strings"

+	"time"

+	"github.com/SlyMarbo/rss"

+)

+// Command-line flags.
+var (
+	debug  = flag.Bool("d", false, "print debug msgs to stderr")
+	format = flag.String("f", "", "output format")
+	root   = flag.String("r", "", "output root")
+)
+
+// Paths computed at run time.
+var (
+	dest  string // directory the barf/blagh renderer is currently writing into
+	links string // file recording the link of every article already rendered
+)

+// Article is one feed item in the form the renderers consume.
+type Article struct {
+	Title   string    // item title
+	Link    string    // item URL; also what gets recorded in the links file
+	Date    time.Time // item date; used for sorting and for blagh's directory layout
+	Content string    // item content, or its summary when the content is empty
+	Tags    []string  // tags given for the feed in the feed file (written out by barf)
+}

+// renderfn is the signature shared by the output renderers (barf, blagh, stdout).
+type renderfn func([]Article)

+func usage() {

+	os.Stderr.WriteString("usage: rrss [-d] [-f barf|blagh] [-r root] <feed file>\n")

+	flag.PrintDefaults()

+	os.Exit(2)

+}

+// check terminates the program through log.Fatal when err is non-nil and
+// does nothing otherwise.
+func check(err error) {
+	if err == nil {
+		return
+	}
+	log.Fatal(err)
+}

+// isold reports whether link is already recorded in the links file at path.
+//
+// The file holds one link per line and is created if it does not exist.
+// A link counts as old only when some line equals it exactly: a substring
+// test would treat ".../post/10" as seen once ".../post/1" is recorded,
+// and a blank line in the file would match every link.
+//
+// If the file cannot be opened, isold returns true so that articles are
+// skipped rather than rendered again.
+func isold(link string, path string) bool {
+	file, err := os.OpenFile(path, os.O_CREATE|os.O_RDONLY, 0775)
+	if err != nil {
+		return true
+	}
+	defer file.Close()
+	scanner := bufio.NewScanner(file)
+	for scanner.Scan() {
+		if scanner.Text() == link {
+			return true
+		}
+	}
+	return false
+}

+// makeold appends link to the links file at path, creating the file if
+// needed, so that later runs treat the article as already seen. An empty
+// link is recorded as the placeholder "empty".
+//
+// It returns the number of bytes written and the first error encountered
+// while opening, writing or closing the file.
+func makeold(link string, path string) (n int, err error) {
+	f, err := os.OpenFile(path, os.O_CREATE|os.O_WRONLY|os.O_APPEND, 0775)
+	if err != nil {
+		// Bail out before deferring Close: f is nil when the open fails.
+		return 0, err
+	}
+	defer func() {
+		// A failed Close on a file we just wrote to can mean lost data,
+		// so surface it unless an earlier error is already being returned.
+		if cerr := f.Close(); err == nil {
+			err = cerr
+		}
+	}()
+	if link == "" {
+		link = "empty"
+	}
+	return f.WriteString(link + "\n")
+}

+// writef stores content, followed by a newline, in the file named
+// filename inside dir. A write error is fatal.
+func writef(dir, filename, content string) {
+	target := path.Join(dir, filename)
+	data := []byte(content + "\n")
+	check(ioutil.WriteFile(target, data, 0775))
+}

+// ensuredir creates dir together with any missing parents; failure is fatal.
+func ensuredir(dir string) {
+	check(os.MkdirAll(dir, 0775))
+}

+// barf renders articles as barf posts (http://code.9front.org/hg/barf).
+//
+// Every article gets its own numbered directory under <root>/src, counting
+// upward from the highest number already present. The directory receives
+// the files title, link, date and body, plus one empty file per tag under
+// tags/. The article's link is then appended to the links file. Any
+// file-system error is fatal.
+func barf(articles []Article) {
+	dest = path.Join(*root, "src")
+	ensuredir(dest)
+	n := lastarticle(dest)
+	for _, a := range articles {
+		n++
+		d := fmt.Sprintf("%s/%d", dest, n)
+		ensuredir(d)
+		writef(d, "title", a.Title)
+		writef(d, "link", a.Link)
+		writef(d, "date", a.Date.String())
+		writef(d, "body", a.Content)
+		if len(a.Tags) > 0 {
+			tagdir := path.Join(d, "tags")
+			ensuredir(tagdir)
+			for _, tag := range a.Tags {
+				f, err := os.Create(path.Join(tagdir, tag))
+				// Check before Close: f is nil when Create fails.
+				check(err)
+				check(f.Close())
+			}
+		}
+		_, err := makeold(a.Link, links)
+		check(err)
+	}
+}

+// http://werc.cat-v.org/apps/blagh

+func blagh(articles []Article) {

+	var err error

+	for _, a := range articles  {

+		dest = path.Join(*root, fmt.Sprintf("%d/%02d/%02d", a.Date.Year(), a.Date.Month(), a.Date.Day()));

+		ensuredir(dest)

+		f, _ := os.Open(dest) // directory will usually not exist yet

+		defer f.Close()

+		n, _ := f.Readdirnames(0)

+		d := fmt.Sprintf("%s/%d", dest, len(n))

+		ensuredir(d)

+		writef(d, "index.md", fmt.Sprintf("%s\n===\n\n%s\n", a.Title, a.Content))

+		_, err = makeold(a.Link, links)

+		check(err)

+	}

+}

+func stdout(articles []Article) {

+	for _, a := range articles {

+		fmt.Printf("title: %s\nlink: %s\ndate: %s\n%s\n\n",

+			a.Title, a.Link, a.Date, a.Content)

+	}

+}

+func lastarticle(dir string) int {

+	f, err := os.Open(dir)

+	defer f.Close()

+	check(err)

+	dn, err := f.Readdirnames(0)

+	check(err)

+	var di []int

+	for _, j := range dn {

+		k, _ := strconv.Atoi(j)

+		di = append(di, k)

+	}

+	sort.Ints(di)

+	n := 0

+	if di != nil {

+		n = di[len(di)-1]

+	}

+	return n

+}

+// loadfeed fetches the feed at url and returns those of its items whose
+// link is not yet recorded in the links file, each carrying tags. A feed
+// that cannot be fetched is logged and yields nil. When the -d flag is
+// set, progress messages are logged as well.
+func loadfeed(url string, tags []string) []Article {
+	if *debug {
+		log.Printf("Fetching feed '%s'", url)
+	}
+	feed, err := rss.Fetch(url)
+	if err != nil {
+		log.Printf("Cannot load feed '%s': %v", url, err)
+		return nil
+	}
+	var fresh []Article
+	for _, item := range feed.Items {
+		if !isold(item.Link, links) {
+			fresh = append(fresh, Article{
+				Title:   item.Title,
+				Link:    item.Link,
+				Date:    item.Date,
+				Content: conorsum(item),
+				Tags:    tags,
+			})
+		}
+	}
+	if *debug {
+		log.Printf("Loaded %d items", len(fresh))
+	}
+	return fresh
+}

+// conorsum returns the item's content, falling back to its summary (which
+// may itself be empty) when the content is empty.
+func conorsum(i *rss.Item) string {
+	if i.Content != "" {
+		return i.Content
+	}
+	return i.Summary
+}

+// main parses the flags, reads the feed file named by the first argument,
+// fetches every feed listed in it and renders the new articles, oldest
+// first, in the format selected with -f (stdout when -f is absent).
+//
+// Each non-blank line of the feed file is "<feed url> [tag ...]", with
+// fields separated by any run of white space.
+func main() {
+	flag.Usage = usage
+	flag.Parse()
+	if flag.Arg(0) == "" {
+		usage()
+	}
+	var render renderfn
+	switch *format {
+	case "barf":
+		render = barf
+	case "blagh":
+		render = blagh
+	case "":
+		render = stdout
+	default:
+		usage()
+	}
+	links = path.Join(*root, "links")
+	file, err := os.Open(flag.Arg(0))
+	check(err)
+	defer file.Close()
+	scanner := bufio.NewScanner(file)
+	var articles []Article
+	for scanner.Scan() {
+		// Fields (rather than Split on " ") tolerates tabs and repeated
+		// spaces and yields nothing for a blank line.
+		fields := strings.Fields(scanner.Text())
+		if len(fields) == 0 {
+			continue
+		}
+		// Tags are scoped to this line so that a feed listed without
+		// tags does not inherit those of the previous feed.
+		var tags []string
+		if len(fields) > 1 {
+			tags = fields[1:]
+		}
+		articles = append(articles, loadfeed(fields[0], tags)...)
+	}
+	check(scanner.Err())
+	sort.Slice(articles, func(i, j int) bool { return articles[i].Date.Before(articles[j].Date) })
+	render(articles)
+}

--- /dev/null

+++ b/rrss.txt

@@ -1,0 +1,41 @@

+     RRSS(1)                                                       RRSS(1)

+     NAME

+          rrss, trrss - RSS feed readers

+     SYNOPSIS

+          rrss [-f barf|blagh] [-r root] [-t tag] [-u url]

+          trrss [-f barf|blagh] [-r root] [-t tag] [-u url]

+     DESCRIPTION

+          Rrss pulls and parses an RSS feed.

+          There are a number of options:

+          -f   Place output in formatted directories for one

+               of two werc apps: barf or blagh. In the absence

+               of the -f flag, formatted output is placed on

+               stdout.

+               A file, links, is created in the root and is populated

+               with the URL of each feed item acquired. On sub-

+               sequent runs, URLs that appear in the links file are

+               not duplicated as new directories.

+          -r   Optionally, create barf or blagh directories

+               under root. Default is the current directory.

+          -t   Create tag for each post (barf only).

+          -u   The feed URL.

+          Trrss is a shell script that wraps the rrss program,

+          outputting plain text but preserving link URLs.

+     SOURCE

+          http://plan9.stanleylieber.com/src/rrss.tgz

+     SEE ALSO

+          http://werc.cat-v.org

+          http://werc.cat-v.org/apps/blagh

+          https://code.9front.org/hg/barf

--- /dev/null

+++ b/trrss

@@ -1,0 +1,8 @@

+#!/bin/rc

+# Run rrss and convert HTML to plain text, retaining link URLs.

+# All command-line arguments are passed through to rrss.

+# The sed step prefixes the title:, link: and date: lines printed by rrss

+# with <p>/<br> markup -- presumably so that they stay on separate lines

+# once the text has gone through htmlfmt (TODO confirm).

+# NOTE: Requires plan9port or 9base. Fix the shebang path to rc.

+rrss $* | sed '

+	s/^title:.*$/<p>&/g

+	s/^link:.*$/<br>&/g

+	s/^date:.*$/<br>&<br>/g

+	' | tcs -t html | htmlfmt -a -c utf-8 | uhtml