123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494 |
- ;;; org-feed.el --- Add RSS feed items to Org files
- ;;
- ;; Copyright (C) 2009 Free Software Foundation, Inc.
- ;;
- ;; Author: Carsten Dominik <carsten at orgmode dot org>
- ;; Keywords: outlines, hypermedia, calendar, wp
- ;; Homepage: http://orgmode.org
- ;; Version: 6.24trans
- ;;
- ;; This file is part of GNU Emacs.
- ;;
- ;; GNU Emacs is free software: you can redistribute it and/or modify
- ;; it under the terms of the GNU General Public License as published by
- ;; the Free Software Foundation, either version 3 of the License, or
- ;; (at your option) any later version.
- ;; GNU Emacs is distributed in the hope that it will be useful,
- ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
- ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- ;; GNU General Public License for more details.
- ;; You should have received a copy of the GNU General Public License
- ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
- ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
- ;;
- ;;; Commentary:
- ;; This library allows you to create entries in an Org-mode file from
- ;; RSS feeds.
- ;;
- ;; Selecting feeds and target locations
- ;; -----------------------------------
- ;;
- ;; This module is configured through a single variable, `org-feed-alist'.
- ;; Here is an example, using a notes/tasks feed from reQall.com.
- ;;
- ;; (setq org-feed-alist
- ;; '(("ReQall"
- ;; "http://www.reqall.com/user/feeds/rss/a1b2c3....."
- ;; "~/org/feeds.org" "ReQall Entries")))
- ;;
- ;; With this setup, the command `M-x org-feed-update-all' will
- ;; collect new entries in the feed at the given URL and create
- ;; entries as subheadings under the "ReQall Entries" heading in the
- ;; file "~/org/feeds.org".
- ;; In addition to these standard arguments, additional keyword-value
- ;; pairs are possible. For example, here we turn entries with
- ;; "<category>Task</category>" into TODO entries by adding the
- ;; keyword to the title, using the `:filter' argument:
- ;;
- ;; (setq org-feed-alist
- ;; '(("ReQall"
- ;; "http://www.reqall.com/user/feeds/rss/a1b2c3....."
- ;; "~/org/feeds.org" "ReQall Entries"
- ;; :filter my-reqall-filter)))
- ;;
- ;; (defun my-reqall-filter (e)
- ;; (when (equal (plist-get e :category) "Task")
- ;; (setq e (plist-put e :title
- ;; (concat "TODO " (plist-get e :title)))))
- ;; e)
- ;;
- ;; A `:template' entry in the alist would override the template
- ;; in `org-feed-default-template' for the construction of the outline
- ;; node to be inserted. Another possibility would be for the filter
- ;; function to create the Org node for the feed item, by adding the
- ;; formatted entry as a `:formatted-for-org' property:
- ;;
- ;; (defun my-reqall-filter (e)
- ;; (setq e (plist-put
- ;; e :formatted-for-org
- ;; (format "* %s\n%s"
- ;; (plist-get e :title)
- ;; (plist-get e :description))))
- ;; e)
- ;;
- ;; The filter function may also decide that certain feed items
- ;; should be ignored, by returning nil instead of the entry.
- ;;
- ;;
- ;; Keeping track of old GUIDs
- ;; --------------------------
- ;;
- ;; Since Org allows you to delete, archive, or move outline nodes,
- ;; org-feed.el needs to keep track of GUIDs in the feed it has
- ;; already processed. It does so by listing them in a special
- ;; drawer, FEEDGUIDS, under the heading that received the input of
- ;; the feed. You should add FEEDGUIDS to your list of drawers
- ;; in the files that receive feed input:
- ;;
- ;; #+DRAWERS: PROPERTIES LOGBOOK FEEDGUIDS
- ;;
- ;; Acknowledgements
- ;; ----------------
- ;;
- ;; org-feed.el is based on ideas by Brad Bozarth who implemented a
- ;; similar mechanism using shell and awk scripts, and who in this
- ;; way made me for the first time look into an RSS feed, showing
- ;; how simple this really was. Because I wanted to include a
- ;; solution into Org with as few dependencies as possible, I
- ;; reimplemented his ideas in Emacs Lisp.
- ;;; Code:
- (require 'org)
- (declare-function url-retrieve-synchronously "url" (url))
(defgroup org-feed nil
  "Options concerning RSS feeds as inputs for Org files."
  ;; The tag is what Customize shows for this group; it must name this
  ;; module rather than the unrelated "Org ID" group.
  :tag "Org Feed"
  :group 'org)
;;;###autoload
(defcustom org-feed-alist nil
  "Alist specifying RSS feeds that should create inputs for Org.
Each entry in this list specifies an RSS feed that should be queried
to create inbox items in Org.  Each entry is a list with the following items:

name         a custom name for this feed
URL          the Feed URL
file         the target Org file where entries should be listed
headline     the headline under which entries should be listed

Additional arguments can be given using keyword-value pairs:

:template template-string
     The template to create an Org node from a feed item

:filter filter-function
     A function to filter entries before Org nodes are
     created from them.

If no template is given, the one in `org-feed-default-template' is used.
See the docstring of that variable for information on the syntax of this
template.  If creating the node requires more logic than a template can
provide, this task can be delegated to the filter function.

The filter function gets as an argument a property list describing the item.
That list has a property for each field, for example `:title' for the
`<title>' field and `:pubDate' for the publication date.  In addition,
it contains the following properties:

`:item-full-text'   the full text in the <item> tag
`:guid-permalink'   t when the guid property is a permalink

The filter function can modify the existing fields before an item
is constructed using the template.  Or it can construct the node directly,
by adding a `:formatted-for-org' property that specifies the complete
outline node that should be added.

The filter should return the modified entry property list.  It may also
return nil to indicate that this entry should not be added to the Org file
at all."
  :group 'org-feed
  :type '(repeat
          (list :value ("" "http://" "" "")
                (string :tag "Name")
                (string :tag "Feed URL")
                (file :tag "File for inbox")
                (string :tag "Headline for inbox")
                (repeat :inline t
                        (choice
                         (list :inline t :tag "Template"
                               (const :template) (string :tag "Template"))
                         (list :inline t :tag "Filter"
                               (const :filter) (symbol :tag "Filter Function")))))))
(defcustom org-feed-default-template "* %h\n %U\n %description\n %a\n"
  "Default template for turning an RSS feed item into an Org node.
A feed may override this default with its own template.

Every field of the feed item can be inserted with %name, e.g. %title,
%description or %pubDate.  The following special escapes are
recognized in addition:

%h      the title, or the first line of the description
%t      the date as a stamp, either from <pubDate> (if present), or
        the current date.
%T      date and time
%u,%U   like %t,%T, but inactive time stamps
%a      A link, from <guid> if that is a permalink, else from <link>"
  :type '(string :tag "Template")
  :group 'org-feed)
(defcustom org-feed-save-after-adding t
  "Non-nil means the buffer is saved once new feed items were added."
  :type 'boolean
  :group 'org-feed)
(defcustom org-feed-retrieve-method 'url-retrieve-synchronously
  "How the content behind a feed URL is retrieved.
The value is either the symbol `curl' or `wget', in which case that
external program is called, or an Emacs Lisp function.  Such a
function receives the URL and must return a buffer holding the
content of the file the URL points to."
  :type '(choice
          (const :tag "Internally with url.el" url-retrieve-synchronously)
          (const :tag "Externally with curl" curl)
          (const :tag "Externally with wget" wget)
          (function :tag "Function"))
  :group 'org-feed)
(defcustom org-feed-assume-stable t
  "Non-nil means, assume feeds to be stable.
A stable feed is one which only adds and removes items, but never removes
an item with a given GUID and then later adds it back in.  So if the feed
is stable, this means we can simply remember the GUIDs present in the feed
at any given time, as the ones we have seen and processed.  So we can
forget GUIDs that used to be in the feed but no longer are.
Thus, for stable feeds, we only need to remember a limited number of GUIDs.
For unstable ones, we need to remember all GUIDs we have ever seen, which
can be a very long list indeed."
  :group 'org-feed
  :type 'boolean)
(defcustom org-feed-before-adding-hook nil
  "Hook run right before new feed items are added to a file.
This is a good place to, for example, commit the current state of
the file to version control."
  :type 'hook
  :group 'org-feed)
(defcustom org-feed-after-adding-hook nil
  "Hook run once new items have been added to a file.
When `org-feed-save-after-adding' is non-nil, the buffer has already
been saved by the time this hook runs."
  :type 'hook
  :group 'org-feed)
(defvar org-feed-buffer "*Org feed*"
  "Name of the buffer into which a feed is retrieved.")
;;;###autoload
(defun org-feed-update-all ()
  "Fetch new inbox items for every feed in `org-feed-alist'.
Call `org-feed-update' on each feed, then report in the echo area
the total number of new entries and the number of feeds."
  (interactive)
  (let* ((feed-count (length org-feed-alist))
         ;; One count per feed, in the order of `org-feed-alist'.
         (counts (mapcar #'org-feed-update org-feed-alist))
         (total (apply #'+ counts))
         (summary (if (= total 0)
                      "No new entries"
                    (if (= total 1)
                        "1 new entry"
                      (format "%d new entries" total))))
         (noun (if (= feed-count 1) "feed" "feeds")))
    (message "%s from %d %s" summary feed-count noun)))
;;;###autoload
(defun org-feed-update (feed)
  "Get inbox items from FEED.
FEED can be a string with an association in `org-feed-alist', or
it can be a list structured like an entry in `org-feed-alist'.

The feed is retrieved and parsed, items whose GUID is already listed
in the FEEDGUIDS drawer of the inbox headline are dropped, and the
remaining ones are passed through the feed's `:filter' function (if
any), formatted, and inserted below the inbox headline.

Return the number of items that were added, 0 if there were none.
Signal an error if FEED is unknown or cannot be retrieved."
  ;; The function takes exactly one argument, so the interactive spec
  ;; must produce exactly one value.
  (interactive (list (org-completing-read "Feed name: " org-feed-alist)))
  (if (stringp feed) (setq feed (assoc feed org-feed-alist)))
  (unless feed
    (error "No such feed in `org-feed-alist'"))
  (let ((feed-name (car feed))
        (feed-url (nth 1 feed))
        (feed-file (nth 2 feed))
        (feed-headline (nth 3 feed))
        (feed-filter (nth 1 (memq :filter feed)))
        (feed-template (or (nth 1 (memq :template feed))
                           org-feed-default-template))
        feed-buffer feed-pos
        entries old-guids new new-selected)
    (setq feed-buffer (org-feed-get-feed feed-url))
    ;; A retrieval method may hand back a buffer name instead of a
    ;; buffer object; resolve it so the check below accepts it.
    (when (stringp feed-buffer)
      (setq feed-buffer (get-buffer feed-buffer)))
    (unless (and feed-buffer (bufferp feed-buffer))
      (error "Cannot get feed %s" feed-name))
    (setq entries (org-feed-parse-feed feed-buffer))
    (ignore-errors (kill-buffer feed-buffer))
    (save-excursion
      (save-window-excursion
        (setq feed-pos (org-feed-goto-inbox-internal feed-file feed-headline))
        (setq old-guids (org-feed-get-old-guids feed-pos))
        ;; Collect the entries we have not seen before.  ENTRIES itself
        ;; is left intact because it is needed again for the GUID list.
        (dolist (e entries)
          (unless (member (plist-get e :guid) old-guids)
            (push (org-feed-parse-entry e) new)))
        (if (not new)
            (progn (message "No new items in feed %s" feed-name) 0)
          ;; Format the new entries
          (run-hooks 'org-feed-before-adding-hook)
          (setq new-selected new)
          (when feed-filter
            (setq new-selected (mapcar feed-filter new-selected)))
          ;; The filter returns nil for entries that should be ignored;
          ;; `org-feed-format-entry' passes nil through, `delq' drops it.
          (setq new-selected
                (delq nil
                      (mapcar
                       (lambda (e) (org-feed-format-entry e feed-template))
                       new-selected)))
          ;; Insert the new items
          (apply 'org-feed-add-items feed-pos new-selected)
          ;; Update the list of seen GUIDs in a drawer.  All new GUIDs
          ;; are recorded, including those rejected by the filter, so
          ;; that rejected items are not processed again.
          (if org-feed-assume-stable
              (apply 'org-feed-add-guids feed-pos 'replace entries)
            (apply 'org-feed-add-guids feed-pos nil new))
          (goto-char feed-pos)
          (show-children)
          (when org-feed-save-after-adding
            (save-buffer))
          ;; Report and return what was actually inserted, not what was
          ;; merely new before filtering.
          (let ((nadded (length new-selected)))
            (message "Added %d new item%s from feed %s to file %s, heading %s"
                     nadded (if (= nadded 1) "" "s")
                     feed-name
                     (file-name-nondirectory feed-file) feed-headline)
            (run-hooks 'org-feed-after-adding-hook)
            nadded))))))
;;;###autoload
(defun org-feed-goto-inbox (feed)
  "Go to the inbox that captures feed FEED.
FEED is either the name of a feed in `org-feed-alist' or a list
structured like an entry of that variable.  When called
interactively and `org-feed-alist' has a single entry, that entry is
used without prompting.
Signal an error if FEED names no entry in `org-feed-alist'."
  (interactive
   (list (if (= (length org-feed-alist) 1)
             (car org-feed-alist)
           (org-completing-read "Feed name: " org-feed-alist))))
  (if (stringp feed) (setq feed (assoc feed org-feed-alist)))
  (unless feed
    (error "No such feed in `org-feed-alist'"))
  ;; Delegate to the internal helper, which takes the file and the
  ;; headline; this command itself only accepts a single FEED argument.
  (org-feed-goto-inbox-internal (nth 2 feed) (nth 3 feed)))
(defun org-feed-goto-inbox-internal (file heading)
  "Find or create HEADING in FILE.
Visit FILE, widen the buffer and search for a headline whose text is
HEADING, optionally followed by tags.  HEADING is matched literally,
so characters that are special in regular expressions are safe.
If no such headline exists, a new top-level headline HEADING is
appended at the end of the buffer.
Switch to that buffer, and return the position of that headline."
  (find-file file)
  (widen)
  (goto-char (point-min))
  (if (re-search-forward
       ;; Quote HEADING: it is plain text, not a regexp.  Unquoted, a
       ;; heading such as "C++ [news]" would never match and a duplicate
       ;; headline would be appended on every update.
       (concat "^\\*+[ \t]+" (regexp-quote heading)
               "[ \t]*\\(:.*?:[ \t]*\\)?$")
       nil t)
      (goto-char (match-beginning 0))
    (goto-char (point-max))
    (insert "\n\n* " heading "\n\n")
    (org-back-to-heading t))
  (point))
(defun org-feed-get-old-guids (pos)
  "Return the GUIDs stored in the FEEDGUIDS drawer of the entry at POS.
The drawer is looked for between POS and the end of the subtree
starting there.  The drawer content is trimmed and split at line
breaks; the result is a list of strings, or nil when no drawer with
content is found."
  (save-excursion
    (goto-char pos)
    (let ((subtree-end (save-excursion (org-end-of-subtree t t)))
          (drawer-re "^[ \t]*:FEEDGUIDS:[ \t]*\n\\([^\000]*?\\)\n[ \t]*:END:"))
      (when (re-search-forward drawer-re subtree-end t)
        (let ((body (org-trim (org-match-string-no-properties 1))))
          (org-split-string body "[ \t]*\n[ \t]*"))))))
(defun org-feed-add-guids (pos replace &rest entries)
  "Add GUIDs for headline at POS.
ENTRIES are property lists; the `:guid' value of each entry that has
one is written on its own line at the top of the FEEDGUIDS drawer of
the entry at POS.  If the entry has no such drawer yet, an empty one
is created in front of the next headline.
When REPLACE is non-nil, replace all GUIDs by the new ones.
Signal an error if REPLACE is non-nil and the existing drawer is not
closed by an :END: line inside the subtree at POS."
  (save-excursion
    (goto-char pos)
    (let ((end (save-excursion (org-end-of-subtree t t)))
          guid)
      (if (re-search-forward "^[ \t]*:FEEDGUIDS:[ \t]*\n" end t)
          (progn
            (goto-char (match-end 0))
            (when replace
              ;; Look for the closing line only inside this subtree.  An
              ;; unbounded search could find the :END: of a drawer in a
              ;; later entry and delete everything in between.
              (let ((drawer-end
                     (save-excursion
                       (and (re-search-forward "^[ \t]*:END:" end t)
                            (match-beginning 0)))))
                (unless drawer-end
                  (error "FEEDGUIDS drawer is not closed by :END:"))
                (delete-region (point) drawer-end))))
        (outline-next-heading)
        (insert " :FEEDGUIDS:\n :END:\n")
        ;; Move back to the start of the :END: line, so that the GUIDs
        ;; end up inside the new drawer.
        (beginning-of-line 0))
      (dolist (entry entries)
        (when (setq guid (plist-get entry :guid))
          (insert " " guid "\n"))))))
(defun org-feed-add-items (pos &rest entries)
  "Insert the formatted ENTRIES below the headline at POS.
Each entry is a property list whose `:formatted-for-org' value is
pasted with `org-paste-subtree', one level below the headline at
POS, after the last non-blank line of that headline's subtree.
The insertion position is pushed onto the Org mark ring.
Signal an error if POS is not at a headline."
  (save-excursion
    (goto-char pos)
    (if (not (looking-at org-complex-heading-regexp))
        (error "Wrong position"))
    (let ((child-level (org-get-valid-level (length (match-string 1)) 1)))
      ;; Go to the line following the last non-blank line of the subtree.
      (org-end-of-subtree t t)
      (skip-chars-backward " \t\n")
      (beginning-of-line 2)
      (setq pos (point))
      ;; Like the pop-based loop this replaces, stop at the first nil entry.
      (while (and entries (car entries))
        (org-paste-subtree child-level
                           (plist-get (car entries) :formatted-for-org)
                           'yank)
        (setq entries (cdr entries)))
      (org-mark-ring-push pos))))
(defun org-feed-format-entry (entry template)
  "Format ENTRY so that it can be inserted into an Org file.
ENTRY is a property list.  This function adds a `:formatted-for-org' property
and returns the full property list.
If that property is already present, nothing changes.
If ENTRY is nil, return nil.

TEMPLATE is a string in which %-escapes are replaced.  The special
escapes %h, %t, %T, %u, %U and %a are described in the docstring of
`org-feed-default-template'.  Any other %name is replaced by the
value of the `:name' property of ENTRY; when such an escape stands
alone on its line, a multi-line value is indented like that line.
Escapes for which ENTRY has no value are left untouched."
  (unless (or (not entry)                          ; not an entry at all
              (plist-get entry :formatted-for-org)) ; already formatted
    (let* ((dlines (org-split-string (or (plist-get entry :description) "???")
                                     "\n"))
           (time (or (if (plist-get entry :pubDate)
                         (org-read-date t t (plist-get entry :pubDate)))
                     (current-time)))
           (link (or (and (plist-get entry :guid-permalink)
                          (plist-get entry :guid))
                     (plist-get entry :link)))
           ;; Values of the special escapes, keyed by escape name.  They
           ;; live in a local alist, so nothing is set globally and the
           ;; lookup does not depend on dynamic binding.
           (specials
            (list
             (cons "h" (or (plist-get entry :title) (car dlines) "???"))
             (cons "t" (format-time-string (org-time-stamp-format nil nil) time))
             (cons "T" (format-time-string (org-time-stamp-format t nil) time))
             (cons "u" (format-time-string (org-time-stamp-format nil t) time))
             (cons "U" (format-time-string (org-time-stamp-format t t) time))
             (cons "a" (if link (concat "[[" link "]]\n") ""))))
           name tmp)
      (with-temp-buffer
        (insert template)
        (goto-char (point-min))
        (while (re-search-forward "%\\([a-zA-Z]+\\)" nil t)
          (setq name (match-string 1))
          (cond
           ;; Special escape: every value in SPECIALS is a string.
           ((setq tmp (cdr (assoc name specials)))
            (replace-match tmp t t))
           ;; Field of the feed item.
           ((setq tmp (plist-get entry (intern (concat ":" name))))
            (save-excursion
              (save-match-data
                (beginning-of-line 1)
                ;; Escape alone on its line: keep continuation lines
                ;; aligned with the indentation of that line.
                (when (looking-at (concat "^\\([ \t]*\\)%" name "[ \t]*$"))
                  (setq tmp (org-feed-make-indented-block
                             tmp (org-get-indentation))))))
            (replace-match tmp t t))
           ;; Unknown escape: leave it in the text as it is.
           ))
        (setq entry (plist-put entry :formatted-for-org (buffer-string))))))
  entry)
(defun org-feed-make-indented-block (s n)
  "Return the multi-line string S with N spaces of indentation added.
The indentation is put after each line break, so the first line is
left as it is.  A string without a line break is returned unchanged."
  (if (string-match "\n" s)
      (let ((separator (concat "\n" (make-string n ?\s))))
        (mapconcat #'identity (org-split-string s "\n") separator))
    s))
(defun org-feed-get-feed (url)
  "Get the RSS feed file at URL and return the buffer.
The retrieval method is selected by `org-feed-retrieve-method'.  For
the external programs `curl' and `wget' the output is collected in
the buffer named by `org-feed-buffer', which is killed first if it
already exists.  Return nil if `org-feed-retrieve-method' is none of
the supported values."
  (cond
   ((eq org-feed-retrieve-method 'url-retrieve-synchronously)
    (url-retrieve-synchronously url))
   ((eq org-feed-retrieve-method 'curl)
    (ignore-errors (kill-buffer org-feed-buffer))
    ;; --silent keeps curl's progress meter, which goes to stderr and
    ;; therefore into the same buffer, out of the feed text.
    (call-process "curl" nil org-feed-buffer nil "--silent" url)
    ;; Return the buffer object, not just its name.
    (get-buffer org-feed-buffer))
   ((eq org-feed-retrieve-method 'wget)
    (ignore-errors (kill-buffer org-feed-buffer))
    ;; "-q -O -" are wget options: be quiet, write to standard output.
    (call-process "wget" nil org-feed-buffer nil "-q" "-O" "-" url)
    (get-buffer org-feed-buffer))
   ((functionp org-feed-retrieve-method)
    (funcall org-feed-retrieve-method url))))
(defun org-feed-parse-feed (buffer)
  "Parse BUFFER for RSS feed entries.
Returns a list of entries, with each entry a property list,
containing the properties `:guid' and `:item-full-text'.
`:item-full-text' is the text between the opening and the closing
item tag; `:guid' is the content of the <guid> element on a single
line, or nil if there is none.  Entries are returned in the order in
which they appear in BUFFER.  An <item> that is never closed, and
anything after it, is ignored."
  (let (entries beg end item guid)
    (with-current-buffer buffer
      (widen)
      (goto-char (point-min))
      ;; Accept attributes on the opening tag, e.g. <item rdf:about="...">.
      ;; Stop at an item without closing tag instead of passing nil to
      ;; `buffer-substring' and `goto-char'.
      (while (and (re-search-forward "<item\\>[^>]*>" nil t)
                  (setq beg (point))
                  (re-search-forward "</item>" nil t))
        (setq end (match-beginning 0)
              item (buffer-substring beg end)
              guid (if (string-match "<guid\\>.*?>\\(.*?\\)</guid>" item)
                       (match-string-no-properties 1 item)))
        (push (list :guid guid :item-full-text item) entries)
        (goto-char end))
      (nreverse entries))))
(defun org-feed-parse-entry (entry)
  "Turn the XML elements in ENTRY's `:item-full-text' into properties.
For every element <name>...</name> found in that text, the property
`:name' of ENTRY is set to the element's content.  In addition,
`:guid-permalink' is set to t unless the text contains
isPermaLink=\"false\".  Return the extended property list."
  (with-temp-buffer
    (insert (plist-get entry :item-full-text))
    (goto-char (point-min))
    (let ((element-re "<\\([a-zA-Z]+\\>\\).*?>\\([^\000]*?\\)</\\1>"))
      (while (re-search-forward element-re nil t)
        (let ((prop (intern (concat ":" (match-string 1))))
              (content (match-string 2)))
          (setq entry (plist-put entry prop content)))))
    (goto-char (point-min))
    (if (re-search-forward "isPermaLink[ \t]*=[ \t]*\"false\"" nil t)
        nil
      (setq entry (plist-put entry :guid-permalink t))))
  entry)
- (provide 'org-feed)
- ;;; org-feed.el ends here
- ;; arch-tag: 0929b557-9bc4-47f4-9633-30a12dbb5ae2
|