2022-11-12 22:14:08 -06:00
|
|
|
;;
|
|
|
|
;; Copyright 2022, Jaidyn Levesque <jadedctrl@posteo.at>
|
|
|
|
;;
|
|
|
|
;; This program is free software: you can redistribute it and/or
|
|
|
|
;; modify it under the terms of the GNU General Public License as
|
|
|
|
;; published by the Free Software Foundation, either version 3 of
|
|
|
|
;; the License, or (at your option) any later version.
|
|
|
|
;;
|
|
|
|
;; This program is distributed in the hope that it will be useful,
|
|
|
|
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
;; GNU General Public License for more details.
|
|
|
|
;;
|
|
|
|
;; You should have received a copy of the GNU General Public License
|
|
|
|
;; along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
;;
|
|
|
|
|
|
|
|
(load "date-strings.scm")
|
|
|
|
(load "named-format.scm")
|
|
|
|
|
2022-11-18 21:48:35 -06:00
|
|
|
|
|
|
|
;; The main feedsnake module; parses atom feeds into alists and strings
|
2022-11-12 22:14:08 -06:00
|
|
|
(module feedsnake
|
2022-12-16 17:17:54 -06:00
|
|
|
(updated-feed-string read-feed entries-since write-entry write-entry-to-file write-entries-to-file all-entries entry->string
|
|
|
|
*maildir-template* *mbox-template*)
|
2022-11-12 22:14:08 -06:00
|
|
|
|
|
|
|
(import scheme
|
2022-12-16 17:17:54 -06:00
|
|
|
(chicken base) (chicken condition) (chicken io) (chicken file) (chicken process-context) (chicken pathname) (chicken port)
|
2022-11-23 12:38:22 -06:00
|
|
|
srfi-1 srfi-13 srfi-19 srfi-69
|
2022-11-12 22:14:08 -06:00
|
|
|
date-strings
|
|
|
|
http-client
|
|
|
|
named-format
|
2022-12-16 17:17:54 -06:00
|
|
|
xattr
|
2022-11-12 22:14:08 -06:00
|
|
|
atom rss)
|
|
|
|
|
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
(define *maildir-template*
|
|
|
|
`((entry-template
|
|
|
|
,(string-append
|
|
|
|
"From: ~{{~A ||||from-name}}"
|
|
|
|
"<~{{~A||feedsnake||FROM_USER||author-user||feed-title}}"
|
|
|
|
"@"
|
|
|
|
"~{{~A||localhost||FROM_HOST||author-domain||feed-domain}}>"
|
|
|
|
"\n"
|
|
|
|
"To:~{{ ~A ||You||TO_NAME||USER}}"
|
|
|
|
"<~{{~A||you||TO_USER||USER}}"
|
|
|
|
"@"
|
|
|
|
"~{{~A||localhost||TO_HOST||HOSTNAME}}>"
|
|
|
|
"\n"
|
|
|
|
"Subject: ~{{~A||Unnamed post||title}}\n"
|
|
|
|
"Date: ~{{~A||||updated-rfc228||published-rfc228}}\n"
|
|
|
|
"\n"
|
|
|
|
"~{{~{~a~^, ~}~%***~%||||urls}}\n"
|
|
|
|
"~{{~A||||summary}}\n"))
|
|
|
|
(multifile-output? #t)))
|
|
|
|
|
|
|
|
|
|
|
|
(define *mbox-template*
|
|
|
|
`((entry-template ,(string-append
|
|
|
|
"From FEEDSNAKE ~{{~A||||updated-mbox||published-mbox}}\n"
|
|
|
|
(car (alist-ref 'entry-template *maildir-template*))
|
|
|
|
"\n"))
|
|
|
|
(multifile-output? #f)))
|
|
|
|
|
|
|
|
(define *default-template*
|
|
|
|
(append *maildir-template*
|
|
|
|
'((output-dir "./"))))
|
|
|
|
|
|
|
|
(define *default-values*
|
|
|
|
'((output-dir "./")))
|
|
|
|
|
|
|
|
(define *default-multifile-values*
|
|
|
|
'((filename-template "~{{~A||||updated||published}}.~{{~A||you||USER}}@~{{~A||localhost|HOSTNAME}}")
|
|
|
|
(multifile-output? #t)))
|
|
|
|
|
|
|
|
(define *default-singlefile-values*
|
|
|
|
'((filename-template "feed.out")
|
|
|
|
(multifile-output? #f)))
|
|
|
|
|
|
|
|
|
2022-11-12 22:14:08 -06:00
|
|
|
;; Read the given port into a feedsnake-feed (alist), no matter the format! c:<
|
|
|
|
(define (read-feed in-port)
|
|
|
|
(let (;;[rss (rss:read in-port)]
|
|
|
|
[atom (read-atom-feed in-port)])
|
|
|
|
(if atom
|
|
|
|
(atom-doc->feedsnake-feed atom)
|
|
|
|
#f)))
|
|
|
|
|
|
|
|
|
|
|
|
;; A list of entries updated since the given date
|
|
|
|
(define (entries-since feed date-utc)
|
|
|
|
(let ([entry-date (lambda (entry) (car (alist-ref 'updated entry)))]
|
|
|
|
[since-entries '()])
|
|
|
|
(map
|
|
|
|
(lambda (entry)
|
|
|
|
(if (date>=? (entry-date entry) date-utc)
|
|
|
|
(set! since-entries
|
|
|
|
(append since-entries (list entry)))))
|
|
|
|
(car (alist-ref 'entries feed)))
|
|
|
|
since-entries))
|
|
|
|
|
|
|
|
|
|
|
|
;; Returns either the updated string of a feed (in comparison to old string),
|
|
|
|
;; or #f if literally nothing's changed
|
|
|
|
(define (updated-feed-string url old-string)
|
|
|
|
(let* ([new-string (fetch-feed-string url)]
|
|
|
|
[updated? (not (eq? (hash old-string) (hash new-string)))])
|
|
|
|
(if updated?
|
|
|
|
new-string
|
|
|
|
#f)))
|
|
|
|
|
|
|
|
|
|
|
|
;; Download a feed (AKA fetch over HTTP to a string)
|
|
|
|
(define (fetch-feed-string url)
|
|
|
|
(call-with-output-string
|
|
|
|
(lambda (out) (fetch-http url out))))
|
|
|
|
|
|
|
|
|
|
|
|
(define (entry->string entry template)
|
|
|
|
(named-format
|
|
|
|
template
|
2022-11-18 21:48:35 -06:00
|
|
|
(append entry
|
|
|
|
(entry-templating-parameters entry template))))
|
2022-11-12 22:14:08 -06:00
|
|
|
|
|
|
|
|
|
|
|
;; Returns an alist of string replacements/parameters for a given entry
|
|
|
|
;; For use with named-format
|
2022-11-18 21:48:35 -06:00
|
|
|
(define (entry-templating-parameters entry template)
|
|
|
|
(append
|
|
|
|
entry
|
|
|
|
(entry-url-templating-parameters entry)
|
|
|
|
(entry-author-templating-parameters entry)
|
|
|
|
(entry-date-templating-parameters entry)))
|
|
|
|
|
|
|
|
|
|
|
|
;; URL-related named-format templating parameters for given entry
|
|
|
|
(define (entry-url-templating-parameters entry)
|
|
|
|
(let ([urls (alist-car-ref 'urls entry)])
|
|
|
|
`((url ,(cond
|
2022-11-12 22:14:08 -06:00
|
|
|
[(list? urls) (car urls)]
|
2022-11-18 21:48:35 -06:00
|
|
|
[(string? urls) urls])))))
|
|
|
|
|
|
|
|
|
|
|
|
;; Author-related named-format templating parameters for given entry
|
|
|
|
(define (entry-author-templating-parameters entry)
|
|
|
|
(let* ([authors (alist-car-ref 'authors entry)]
|
|
|
|
[author (if authors (car authors) (alist-car-ref 'feed-title entry))])
|
|
|
|
`((author ,author))))
|
|
|
|
|
|
|
|
|
|
|
|
;; Date-related named-format templating parameters for given entry
|
|
|
|
(define (entry-date-templating-parameters entry)
|
|
|
|
(let* ([updated (or (alist-car-ref 'updated entry) (alist-car-ref 'published entry))]
|
|
|
|
[published (or (alist-car-ref 'published entry) updated)])
|
|
|
|
`((updated-rfc228 ,(if updated (date->rfc228-string updated)))
|
|
|
|
(published-rfc228 ,(if published (date->rfc228-string published)))
|
|
|
|
(updated-mbox ,(if updated (date->mbox-string updated)))
|
|
|
|
(published-mbox ,(if published (date->mbox-string published))))))
|
2022-11-12 22:14:08 -06:00
|
|
|
|
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
;; Writes a given feed entry to the out-port, as per the feedsnake-unix-format template alist
|
|
|
|
(define (write-entry entry template-alist out-port)
|
|
|
|
(write-string
|
|
|
|
(entry->string (append (get-environment-variables) entry)
|
|
|
|
(alist-car-ref 'entry-template template-alist))
|
|
|
|
#f
|
|
|
|
out-port))
|
|
|
|
|
|
|
|
|
|
|
|
;; Write an entry to the given file (directory for multifile; normal file otherwise)
|
|
|
|
(define (write-entry-to-file entry template-alist out-path)
|
|
|
|
(let* ([template (if (alist-car-ref 'multifile-output? template-alist)
|
|
|
|
(append template-alist *default-multifile-values* *default-values*)
|
|
|
|
(append template-alist *default-singlefile-values* *default-values*))]
|
|
|
|
[file-mode (if (alist-car-ref 'multifile-output? template) #:text #:append)])
|
|
|
|
(call-with-output-file
|
|
|
|
(entry-output-path entry template out-path)
|
|
|
|
(lambda (out-port)
|
|
|
|
(write-entry entry template out-port))
|
|
|
|
file-mode)))
|
|
|
|
|
|
|
|
|
|
|
|
;; Writes all entries in a list to an out-path (mere convenience function)
|
|
|
|
(define (write-entries-to-file entries template-alist out-path)
|
|
|
|
(map (lambda (entry)
|
|
|
|
(write-entry-to-file entry template-alist out-path))
|
|
|
|
entries))
|
|
|
|
|
|
|
|
|
|
|
|
;; Decides the correct output path for an entry, given the template's filename rules etc.
|
|
|
|
(define (entry-output-path entry template-alist base-out-path)
|
|
|
|
(let ([multifile? (alist-car-ref 'multifile-output? template-alist)])
|
|
|
|
(if multifile?
|
|
|
|
(multifile-entry-path entry template-alist base-out-path)
|
|
|
|
(singlefile-entry-path entry template-alist base-out-path))))
|
|
|
|
|
|
|
|
|
|
|
|
;; Output path for entry with a single-file template
|
|
|
|
(define (singlefile-entry-path entry template-alist base-out-path)
|
|
|
|
(if (directory-exists? base-out-path)
|
|
|
|
(signal
|
|
|
|
(make-property-condition
|
|
|
|
'exn 'location 'file
|
|
|
|
'message (string-append base-out-path " shouldn't be a directory.")))
|
|
|
|
base-out-path))
|
|
|
|
|
|
|
|
|
|
|
|
;; Output path for an entry w multifile template
|
|
|
|
(define (multifile-entry-path entry template-alist base-out-path)
|
|
|
|
(let* ([file-leaf (named-format (alist-car-ref 'filename-template template-alist) entry)])
|
|
|
|
(if (create-directory base-out-path)
|
|
|
|
(string-append base-out-path "/" file-leaf)
|
|
|
|
(signal
|
|
|
|
(make-property-condition
|
|
|
|
'exn 'location 'file
|
|
|
|
'message (string-append base-out-path " either isn't accessible or isn't a directory."))))))
|
|
|
|
|
|
|
|
|
|
|
|
;; Switch the cached version of the feed with a newer version, if available
|
|
|
|
(define (update-feed-file feed-path)
|
|
|
|
(let* ([old-string (call-with-input-file feed-path
|
|
|
|
(lambda (in-port) (read-string #f in-port)))]
|
|
|
|
[new-string (updated-feed-string
|
|
|
|
(get-xattr feed-path "user.xdg.origin.url")
|
|
|
|
old-string)])
|
|
|
|
(if new-string
|
|
|
|
(call-with-output-file feed-path
|
|
|
|
(lambda (out) (write-string new-string #f out))))
|
|
|
|
new-string))
|
|
|
|
|
|
|
|
|
|
|
|
;; List of entries updated/published since last feed parsing
|
|
|
|
(define (latest-entries feed-path)
|
|
|
|
(let* ([feed (call-with-input-file feed-path read-feed)]
|
|
|
|
[xattr-last-update (get-xattr feed-path "user.feedsnake.parsed")]
|
|
|
|
[last-update (if xattr-last-update
|
|
|
|
(rfc339-string->date xattr-last-update)
|
|
|
|
(date->utc-date (make-date 0 0 0 0 01 01 1971)))])
|
|
|
|
(set-xattr feed-path "user.feedsnake.parsed"
|
|
|
|
(date->rfc339-string (current-date-utc)))
|
|
|
|
(entries-since feed last-update)))
|
|
|
|
|
|
|
|
|
|
|
|
;; List of all entries of the feed file
|
|
|
|
(define (all-entries feed-path)
|
|
|
|
(let ([feed (call-with-input-file feed-path read-feed)])
|
|
|
|
(car (alist-ref 'entries feed))))
|
|
|
|
|
|
|
|
|
|
|
|
;; Atom parsing
|
|
|
|
;; ————————————————————————————————————————
|
|
|
|
|
2022-11-12 22:14:08 -06:00
|
|
|
;; Parse an atom feed into a feedsnake-friendly alist
|
|
|
|
(define (atom-doc->feedsnake-feed atom)
|
|
|
|
`((title ,(last (feed-title atom)))
|
2022-11-23 12:38:22 -06:00
|
|
|
(url ,(atom-feed-preferred-url atom))
|
2022-11-18 21:48:35 -06:00
|
|
|
(authors ,(map author-name (feed-authors atom)))
|
2022-11-12 22:14:08 -06:00
|
|
|
(updated ,(feed-updated atom))
|
|
|
|
(entry-updated ,(atom-feed-latest-entry-date atom))
|
2022-11-18 21:48:35 -06:00
|
|
|
(entries ,(map
|
|
|
|
(lambda (entry)
|
|
|
|
(atom-entry->feedsnake-entry entry atom))
|
|
|
|
(feed-entries atom)))))
|
2022-11-12 22:14:08 -06:00
|
|
|
|
|
|
|
|
|
|
|
;; Parse an atom entry into a feedsnake entry :>
|
2022-11-18 21:48:35 -06:00
|
|
|
(define (atom-entry->feedsnake-entry entry atom)
|
2022-11-12 22:14:08 -06:00
|
|
|
(let ([published (rfc339-string->date (entry-published entry))]
|
2022-11-18 21:48:35 -06:00
|
|
|
[updated (rfc339-string->date (entry-updated entry))]
|
|
|
|
[feed-authors (map author-name (feed-authors atom))]
|
|
|
|
[entry-authors (map author-name (entry-authors entry))])
|
2022-11-12 22:14:08 -06:00
|
|
|
`((title ,(last (entry-title entry)))
|
|
|
|
(updated ,(or updated published))
|
|
|
|
(published ,(or published updated))
|
|
|
|
(summary ,(last (entry-summary entry)))
|
2022-11-23 12:38:22 -06:00
|
|
|
(urls ,(map (lambda (link) (atom-link->string link atom))
|
|
|
|
(entry-links entry)))
|
2022-11-18 21:48:35 -06:00
|
|
|
(authors ,(if (null? entry-authors) feed-authors entry-authors))
|
2022-11-30 22:32:03 -06:00
|
|
|
(feed-title ,(last (feed-title atom))))))
|
2022-11-12 22:14:08 -06:00
|
|
|
|
|
|
|
|
2022-11-23 12:38:22 -06:00
|
|
|
;; The preferred/given URL for an atom feed
|
|
|
|
(define (atom-feed-preferred-url atom)
|
|
|
|
(car
|
|
|
|
(filter
|
|
|
|
(lambda (link)
|
|
|
|
(string=? (link-relation link) "self"))
|
|
|
|
(feed-links atom))))
|
|
|
|
|
|
|
|
|
2022-11-12 22:14:08 -06:00
|
|
|
;; Get an atom feed's latest date for an entry's updating/publishing
|
|
|
|
(define (atom-feed-latest-entry-date atom)
|
|
|
|
(let ([entry-date
|
|
|
|
(lambda (entry)
|
|
|
|
(or (rfc339-string->date (entry-updated entry))
|
|
|
|
(rfc339-string->date (entry-published entry))))])
|
|
|
|
(reduce
|
|
|
|
(lambda (a b)
|
|
|
|
(if (date>=? a b) a b))
|
|
|
|
#f
|
|
|
|
(map entry-date (feed-entries atom)))))
|
|
|
|
|
|
|
|
|
2022-11-23 12:38:22 -06:00
|
|
|
;; Convert an atom-link into a proper, valid url
|
|
|
|
(define (atom-link->string link atom)
|
|
|
|
(if (string-contains (link-uri link) "://")
|
|
|
|
(link-uri link)
|
|
|
|
(string-append (pathname-directory (atom-feed-preferred-url atom))
|
|
|
|
"/"
|
|
|
|
(link-uri link))))
|
|
|
|
|
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
;; Misc. functions
|
|
|
|
;; ————————————————————————————————————————
|
|
|
|
|
|
|
|
;; Just car's the value of alist-ref (if it exists)
|
|
|
|
(define (alist-car-ref key alist)
|
|
|
|
(let ([value (alist-ref key alist)])
|
|
|
|
(if value
|
|
|
|
(car value)
|
|
|
|
#f)))
|
|
|
|
|
|
|
|
|
2022-11-12 22:14:08 -06:00
|
|
|
;; Download a file over HTTP to the given port.
|
|
|
|
(define (fetch-http url out-port)
|
|
|
|
(call-with-input-request
|
|
|
|
url #f
|
|
|
|
(lambda (in-port) (copy-port in-port out-port))))
|
|
|
|
|
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
;; Convert a date of arbitrary timezone to UTC
|
|
|
|
(define (date->utc-date date)
|
|
|
|
(time-utc->date (date->time-utc date)))
|
2022-11-12 22:14:08 -06:00
|
|
|
|
2022-11-18 21:48:35 -06:00
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
;; The current date, with UTC (-0; Z) timezone
|
|
|
|
(define (current-date-utc)
|
|
|
|
(date->utc-date (current-date)))
|
2022-11-18 21:48:35 -06:00
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
) ;; feedsnake module
|
2022-11-18 21:48:35 -06:00
|
|
|
|
|
|
|
|
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
;; The UNIX-style frontend for feedsnake
|
|
|
|
(module feedsnake-unix
|
|
|
|
(main main)
|
2022-11-18 21:48:35 -06:00
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
(import scheme
|
|
|
|
(chicken base) (chicken file) (chicken file posix) (chicken io)
|
|
|
|
(chicken process-context) (chicken process-context posix)
|
|
|
|
srfi-1
|
|
|
|
feedsnake
|
|
|
|
getopt-long)
|
2022-11-18 21:48:35 -06:00
|
|
|
|
|
|
|
|
2022-12-01 20:31:09 -06:00
|
|
|
(define *help-msg*
|
|
|
|
(string-append
|
|
|
|
"usage: feedsnake [-h] FILE...\n"
|
|
|
|
"Feedsnake is a program for converting Atom feeds into mbox/maildir files.\n"
|
|
|
|
"Any Atom feeds passed as an argument will be output in mbox format.\n\n"))
|
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
|
2022-12-01 20:31:09 -06:00
|
|
|
(define *opts*
|
|
|
|
'((help
|
|
|
|
"Print a usage message"
|
2022-12-16 17:17:54 -06:00
|
|
|
(single-char #\h))
|
2022-12-17 13:43:13 -06:00
|
|
|
(outdir
|
|
|
|
"Output directory, used for maildir output"
|
|
|
|
(single-char #\d)
|
|
|
|
(value (required DIR)))
|
2022-12-16 17:17:54 -06:00
|
|
|
(output
|
2022-12-17 13:43:13 -06:00
|
|
|
"Output file, used for mbox output. Default is stdout."
|
2022-12-16 17:17:54 -06:00
|
|
|
(single-char #\o)
|
|
|
|
(value (required FILE)))))
|
|
|
|
|
|
|
|
|
|
|
|
;; Prints cli usage to stderr.
|
|
|
|
(define (help)
|
|
|
|
(write-string *help-msg* #f (open-output-file* fileno/stderr))
|
|
|
|
(write-string (usage *opts*) #f (open-output-file* fileno/stderr)))
|
2022-12-01 20:31:09 -06:00
|
|
|
|
|
|
|
|
|
|
|
;; The `main` procedure that should be called to run feedsnake-unix for use as script.
|
|
|
|
;; TODO: accept piped-in feeds
|
|
|
|
(define (main)
|
2022-12-16 17:17:54 -06:00
|
|
|
(let* ([args (getopt-long (command-line-arguments) *opts*)]
|
2022-12-17 13:43:13 -06:00
|
|
|
[output-dir (alist-ref 'outdir args)]
|
|
|
|
[output (or (alist-ref 'output args) output-dir)]
|
|
|
|
[template (if output-dir *maildir-template* *mbox-template*)])
|
2022-12-01 20:31:09 -06:00
|
|
|
(if (alist-ref 'help args)
|
|
|
|
(help)
|
|
|
|
(map (lambda (free-arg)
|
2022-12-16 17:17:54 -06:00
|
|
|
(cond [(not (file-exists? free-arg))
|
|
|
|
#f]
|
|
|
|
[output
|
2022-12-17 13:43:13 -06:00
|
|
|
(write-entries-to-file (all-entries free-arg) template output)]
|
2022-12-16 17:17:54 -06:00
|
|
|
[(not output)
|
|
|
|
(map (lambda (entry)
|
2022-12-17 13:43:13 -06:00
|
|
|
(write-entry entry template
|
2022-12-16 17:17:54 -06:00
|
|
|
(open-output-file* fileno/stdout)))
|
|
|
|
(all-entries free-arg))]))
|
2022-12-01 20:31:09 -06:00
|
|
|
(alist-ref '@ args)))))
|
|
|
|
|
|
|
|
|
2022-12-16 17:17:54 -06:00
|
|
|
;; Supposed config root of the user (as per XDG, or simple ~/.config)
|
2022-11-12 22:14:08 -06:00
|
|
|
(define (config-directory)
|
|
|
|
(or (get-environment-variable "XDG_CONFIG_HOME")
|
|
|
|
(string-append (sixth (user-information (current-user-id))) "/.config")))
|
|
|
|
|
|
|
|
|
|
|
|
;; Path of the feedsnake config directory
|
|
|
|
(define (feedsnake-directory)
|
|
|
|
(create-directory (string-append (config-directory) "/feedsnake") #t))
|
|
|
|
|
|
|
|
|
|
|
|
;; Path of the feeds directory
|
|
|
|
(define (feeds-directory)
|
|
|
|
(create-directory (string-append (feedsnake-directory) "/feeds") #t))
|
|
|
|
|
|
|
|
|
|
|
|
;; Lists all configured feeds (files in feed directory)
|
|
|
|
(define (feed-files)
|
|
|
|
(map (lambda (relative-path)
|
|
|
|
(string-append (feeds-directory) "/" relative-path))
|
|
|
|
(directory (feeds-directory))))
|
|
|
|
|
|
|
|
|
|
|
|
) ;; feedsnake-unix module
|