ox-rss.el 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415
  1. ;;; ox-rss.el --- RSS 2.0 Back-End for Org Export Engine
  2. ;; Copyright (C) 2013-2015 Bastien Guerry
  3. ;; Author: Bastien Guerry <bzg@gnu.org>
  4. ;; Keywords: org, wp, blog, feed, rss
  5. ;; This file is not yet part of GNU Emacs.
  6. ;; This program is free software: you can redistribute it and/or modify
  7. ;; it under the terms of the GNU General Public License as published by
  8. ;; the Free Software Foundation, either version 3 of the License, or
  9. ;; (at your option) any later version.
  10. ;; This program is distributed in the hope that it will be useful,
  11. ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  13. ;; GNU General Public License for more details.
  14. ;; You should have received a copy of the GNU General Public License
  15. ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
  16. ;;; Commentary:
  17. ;; This library implements a RSS 2.0 back-end for Org exporter, based on
  18. ;; the `html' back-end.
  19. ;;
  20. ;; It requires Emacs 24.1 at least.
  21. ;;
  22. ;; It provides two commands for export, depending on the desired output:
  23. ;; `org-rss-export-as-rss' (temporary buffer) and `org-rss-export-to-rss'
  24. ;; (as a ".xml" file).
  25. ;;
  26. ;; This backend understands two new option keywords:
  27. ;;
  28. ;; #+RSS_EXTENSION: xml
  29. ;; #+RSS_IMAGE_URL: http://myblog.org/mypicture.jpg
  30. ;;
  31. ;; It uses #+HTML_LINK_HOME: to set the base url of the feed.
  32. ;;
;; Exporting an Org file to RSS modifies each top-level entry by adding a
;; PUBDATE property.  It also calls `org-icalendar-create-uid' to add ID
;; properties; the ID is used as the guid for the feed's item when
;; `org-rss-use-entry-url-as-guid' is nil.
  36. ;;
  37. ;; The top-level headline is used as the title of each RSS item unless
  38. ;; an RSS_TITLE property is set on the headline.
  39. ;;
  40. ;; You typically want to use it within a publishing project like this:
  41. ;;
  42. ;; (add-to-list
  43. ;; 'org-publish-project-alist
  44. ;; '("homepage_rss"
  45. ;; :base-directory "~/myhomepage/"
  46. ;; :base-extension "org"
  47. ;; :rss-image-url "http://lumiere.ens.fr/~guerry/images/faces/15.png"
  48. ;; :html-link-home "http://lumiere.ens.fr/~guerry/"
  49. ;; :html-link-use-abs-url t
  50. ;; :rss-extension "xml"
  51. ;; :publishing-directory "/home/guerry/public_html/"
  52. ;; :publishing-function (org-rss-publish-to-rss)
  53. ;; :section-numbers nil
  54. ;; :exclude ".*" ;; To exclude all files...
  55. ;; :include ("index.org") ;; ... except index.org.
  56. ;; :table-of-contents nil))
  57. ;;
  58. ;; ... then rsync /home/guerry/public_html/ with your server.
  59. ;;
  60. ;; By default, the permalink for a blog entry points to the headline.
  61. ;; You can specify a different one by using the :RSS_PERMALINK:
  62. ;; property within an entry.
  63. ;;; Code:
  64. (require 'ox-html)
  65. (declare-function url-encode-url "url-util" (url))
  66. ;;; Variables and options
;; Customization group holding every user option defined in this file.
(defgroup org-export-rss nil
  "Options specific to RSS export back-end."
  :tag "Org RSS"
  :group 'org-export
  :version "24.4"
  :package-version '(Org . "8.0"))
(defcustom org-rss-image-url "http://orgmode.org/img/org-mode-unicorn-logo.png"
  "The URL of an image for the RSS feed.
This is the default value of the `:rss-image-url' export option,
which can also be set with the RSS_IMAGE_URL keyword."
  :group 'org-export-rss
  :type 'string)
(defcustom org-rss-extension "xml"
  "File extension for the RSS 2.0 feed.
The value is given without the leading dot.  It is the default
value of the `:rss-extension' export option, which can also be
set with the RSS_EXTENSION keyword."
  :group 'org-export-rss
  :type 'string)
(defcustom org-rss-categories 'from-tags
  "Where to extract items category information from.
The default, `from-tags', is to extract categories from the tags
of the headlines, one <category> element per tag.  When set to
another value, extract the category from the :CATEGORY: property
of the entry."
  :group 'org-export-rss
  :type '(choice
          (const :tag "From tags" from-tags)
          (const :tag "From the category property" from-category)))
(defcustom org-rss-use-entry-url-as-guid t
  "Use the URL for the <guid> metatag?
When non-nil, the permalink of the entry is used as its <guid>.
When nil, the <guid> is the ID property of the entry, falling
back on its CUSTOM_ID property and then on the permalink.  The
export commands call `org-icalendar-create-uid' on the file
before exporting."
  :group 'org-export-rss
  :type 'boolean)
  95. ;;; Define backend
;; Register `rss' as a back-end derived from `html'.
(org-export-define-derived-backend 'rss 'html
  ;; Export dispatcher entry.  Each action receives four arguments
  ;; (A S V B) and forwards the first three to the export command;
  ;; the fourth is not used.
  :menu-entry
  '(?r "Export to RSS"
       ((?R "As RSS buffer"
            (lambda (a s v b) (org-rss-export-as-rss a s v)))
        (?r "As RSS file" (lambda (a s v b) (org-rss-export-to-rss a s v)))
        (?o "As RSS file and open"
            (lambda (a s v b)
              ;; When A is non-nil only export; otherwise export and
              ;; open the resulting file.
              (if a (org-rss-export-to-rss t s v)
                (org-open-file (org-rss-export-to-rss nil s v)))))))
  ;; Options specific to this back-end, with their buffer keyword
  ;; (when any) and the variable providing the default value.
  :options-alist
  '((:with-toc nil nil nil) ;; Never include HTML's toc
    (:rss-extension "RSS_EXTENSION" nil org-rss-extension)
    (:rss-image-url "RSS_IMAGE_URL" nil org-rss-image-url)
    (:rss-categories nil nil org-rss-categories))
  ;; Re-indent the complete output once it has been generated.
  :filters-alist '((:filter-final-output . org-rss-final-function))
  ;; Transcoders replacing those of the parent back-end.  Comments,
  ;; comment blocks and timestamps are exported as empty strings.
  :translate-alist '((headline . org-rss-headline)
                     (comment . (lambda (&rest args) ""))
                     (comment-block . (lambda (&rest args) ""))
                     (timestamp . (lambda (&rest args) ""))
                     (plain-text . org-rss-plain-text)
                     (section . org-rss-section)
                     (template . org-rss-template)))
  119. ;;; Export functions
  120. ;;;###autoload
  121. (defun org-rss-export-as-rss (&optional async subtreep visible-only)
  122. "Export current buffer to a RSS buffer.
  123. If narrowing is active in the current buffer, only export its
  124. narrowed part.
  125. If a region is active, export that region.
  126. A non-nil optional argument ASYNC means the process should happen
  127. asynchronously. The resulting buffer should be accessible
  128. through the `org-export-stack' interface.
  129. When optional argument SUBTREEP is non-nil, export the sub-tree
  130. at point, extracting information from the headline properties
  131. first.
  132. When optional argument VISIBLE-ONLY is non-nil, don't export
  133. contents of hidden elements.
  134. Export is done in a buffer named \"*Org RSS Export*\", which will
  135. be displayed when `org-export-show-temporary-export-buffer' is
  136. non-nil."
  137. (interactive)
  138. (let ((file (buffer-file-name (buffer-base-buffer))))
  139. (org-icalendar-create-uid file 'warn-user)
  140. (org-rss-add-pubdate-property))
  141. (org-export-to-buffer 'rss "*Org RSS Export*"
  142. async subtreep visible-only nil nil (lambda () (text-mode))))
  143. ;;;###autoload
  144. (defun org-rss-export-to-rss (&optional async subtreep visible-only)
  145. "Export current buffer to a RSS file.
  146. If narrowing is active in the current buffer, only export its
  147. narrowed part.
  148. If a region is active, export that region.
  149. A non-nil optional argument ASYNC means the process should happen
  150. asynchronously. The resulting file should be accessible through
  151. the `org-export-stack' interface.
  152. When optional argument SUBTREEP is non-nil, export the sub-tree
  153. at point, extracting information from the headline properties
  154. first.
  155. When optional argument VISIBLE-ONLY is non-nil, don't export
  156. contents of hidden elements.
  157. Return output file's name."
  158. (interactive)
  159. (let ((file (buffer-file-name (buffer-base-buffer))))
  160. (org-icalendar-create-uid file 'warn-user)
  161. (org-rss-add-pubdate-property))
  162. (let ((outfile (org-export-output-file-name
  163. (concat "." org-rss-extension) subtreep)))
  164. (org-export-to-file 'rss outfile async subtreep visible-only)))
  165. ;;;###autoload
  166. (defun org-rss-publish-to-rss (plist filename pub-dir)
  167. "Publish an org file to RSS.
  168. FILENAME is the filename of the Org file to be published. PLIST
  169. is the property list for the given project. PUB-DIR is the
  170. publishing directory.
  171. Return output file name."
  172. (let ((bf (get-file-buffer filename)))
  173. (if bf
  174. (with-current-buffer bf
  175. (org-icalendar-create-uid filename 'warn-user)
  176. (org-rss-add-pubdate-property)
  177. (write-file filename))
  178. (find-file filename)
  179. (org-icalendar-create-uid filename 'warn-user)
  180. (org-rss-add-pubdate-property)
  181. (write-file filename) (kill-buffer)))
  182. (org-publish-org-to
  183. 'rss filename (concat "." org-rss-extension) plist pub-dir))
  184. ;;; Main transcoding functions
  185. (defun org-rss-headline (headline contents info)
  186. "Transcode HEADLINE element into RSS format.
  187. CONTENTS is the headline contents. INFO is a plist used as a
  188. communication channel."
  189. (unless (or (org-element-property :footnote-section-p headline)
  190. ;; Only consider first-level headlines
  191. (> (org-export-get-relative-level headline info) 1))
  192. (let* ((author (and (plist-get info :with-author)
  193. (let ((auth (plist-get info :author)))
  194. (and auth (org-export-data auth info)))))
  195. (htmlext (plist-get info :html-extension))
  196. (hl-number (org-export-get-headline-number headline info))
  197. (hl-home (file-name-as-directory (plist-get info :html-link-home)))
  198. (hl-pdir (plist-get info :publishing-directory))
  199. (hl-perm (org-element-property :RSS_PERMALINK headline))
  200. (anchor
  201. (org-export-solidify-link-text
  202. (or (org-element-property :CUSTOM_ID headline)
  203. (concat "sec-" (mapconcat 'number-to-string hl-number "-")))))
  204. (category (org-rss-plain-text
  205. (or (org-element-property :CATEGORY headline) "") info))
  206. (pubdate0 (org-element-property :PUBDATE headline))
  207. (pubdate (let ((system-time-locale "C"))
  208. (if pubdate0
  209. (format-time-string
  210. "%a, %d %b %Y %H:%M:%S %z"
  211. (org-time-string-to-time pubdate0)))))
  212. (title (or (org-element-property :RSS_TITLE headline)
  213. (replace-regexp-in-string
  214. org-bracket-link-regexp
  215. (lambda (m) (or (match-string 3 m)
  216. (match-string 1 m)))
  217. (org-element-property :raw-value headline))))
  218. (publink
  219. (or (and hl-perm (concat (or hl-home hl-pdir) hl-perm))
  220. (concat
  221. (or hl-home hl-pdir)
  222. (file-name-nondirectory
  223. (file-name-sans-extension
  224. (plist-get info :input-file))) "." htmlext "#" anchor)))
  225. (guid (if org-rss-use-entry-url-as-guid
  226. publink
  227. (org-rss-plain-text
  228. (or (org-element-property :ID headline)
  229. (org-element-property :CUSTOM_ID headline)
  230. publink)
  231. info))))
  232. (if (not pubdate0) "" ;; Skip entries with no PUBDATE prop
  233. (format
  234. (concat
  235. "<item>\n"
  236. "<title>%s</title>\n"
  237. "<link>%s</link>\n"
  238. "<author>%s</author>\n"
  239. "<guid isPermaLink=\"false\">%s</guid>\n"
  240. "<pubDate>%s</pubDate>\n"
  241. (org-rss-build-categories headline info) "\n"
  242. "<description><![CDATA[%s]]></description>\n"
  243. "</item>\n")
  244. title publink author guid pubdate contents)))))
  245. (defun org-rss-build-categories (headline info)
  246. "Build categories for the RSS item."
  247. (if (eq (plist-get info :rss-categories) 'from-tags)
  248. (mapconcat
  249. (lambda (c) (format "<category><![CDATA[%s]]></category>" c))
  250. (org-element-property :tags headline)
  251. "\n")
  252. (let ((c (org-element-property :CATEGORY headline)))
  253. (format "<category><![CDATA[%s]]></category>" c))))
  254. (defun org-rss-template (contents info)
  255. "Return complete document string after RSS conversion.
  256. CONTENTS is the transcoded contents string. INFO is a plist used
  257. as a communication channel."
  258. (concat
  259. (format "<?xml version=\"1.0\" encoding=\"%s\"?>"
  260. (symbol-name org-html-coding-system))
  261. "\n<rss version=\"2.0\"
  262. xmlns:content=\"http://purl.org/rss/1.0/modules/content/\"
  263. xmlns:wfw=\"http://wellformedweb.org/CommentAPI/\"
  264. xmlns:dc=\"http://purl.org/dc/elements/1.1/\"
  265. xmlns:atom=\"http://www.w3.org/2005/Atom\"
  266. xmlns:sy=\"http://purl.org/rss/1.0/modules/syndication/\"
  267. xmlns:slash=\"http://purl.org/rss/1.0/modules/slash/\"
  268. xmlns:georss=\"http://www.georss.org/georss\"
  269. xmlns:geo=\"http://www.w3.org/2003/01/geo/wgs84_pos#\"
  270. xmlns:media=\"http://search.yahoo.com/mrss/\">"
  271. "<channel>"
  272. (org-rss-build-channel-info info) "\n"
  273. contents
  274. "</channel>\n"
  275. "</rss>"))
  276. (defun org-rss-build-channel-info (info)
  277. "Build the RSS channel information."
  278. (let* ((system-time-locale "C")
  279. (title (plist-get info :title))
  280. (email (org-export-data (plist-get info :email) info))
  281. (author (and (plist-get info :with-author)
  282. (let ((auth (plist-get info :author)))
  283. (and auth (org-export-data auth info)))))
  284. (date (format-time-string "%a, %d %b %Y %H:%M:%S %z")) ;; RFC 882
  285. (description (org-export-data (plist-get info :description) info))
  286. (lang (plist-get info :language))
  287. (keywords (plist-get info :keywords))
  288. (rssext (plist-get info :rss-extension))
  289. (blogurl (or (plist-get info :html-link-home)
  290. (plist-get info :publishing-directory)))
  291. (image (url-encode-url (plist-get info :rss-image-url)))
  292. (ifile (plist-get info :input-file))
  293. (publink
  294. (concat (file-name-as-directory blogurl)
  295. (file-name-nondirectory
  296. (file-name-sans-extension ifile))
  297. "." rssext)))
  298. (format
  299. "\n<title>%s</title>
  300. <atom:link href=\"%s\" rel=\"self\" type=\"application/rss+xml\" />
  301. <link>%s</link>
  302. <description><![CDATA[%s]]></description>
  303. <language>%s</language>
  304. <pubDate>%s</pubDate>
  305. <lastBuildDate>%s</lastBuildDate>
  306. <generator>%s</generator>
  307. <webMaster>%s (%s)</webMaster>
  308. <image>
  309. <url>%s</url>
  310. <title>%s</title>
  311. <link>%s</link>
  312. </image>
  313. "
  314. title publink blogurl description lang date date
  315. (concat (format "Emacs %d.%d"
  316. emacs-major-version
  317. emacs-minor-version)
  318. " Org-mode " (org-version))
  319. email author image title blogurl)))
(defun org-rss-section (section contents info)
  "Transcode SECTION element into RSS format.
CONTENTS is the section contents.  INFO is a plist used as
a communication channel.

Return CONTENTS unchanged; SECTION and INFO are not used."
  contents)
(defun org-rss-timestamp (timestamp contents info)
  "Transcode a TIMESTAMP object from Org to RSS.
CONTENTS is nil.  INFO is a plist holding contextual
information.

Return the translation of TIMESTAMP given by
`org-timestamp-translate', encoded with
`org-html-encode-plain-text'.  CONTENTS and INFO are not used."
  ;; NOTE(review): the `:translate-alist' of the `rss' back-end
  ;; defined in this file maps `timestamp' to a function returning an
  ;; empty string, not to this function -- confirm whether this
  ;; transcoder is still meant to be used.
  (org-html-encode-plain-text
   (org-timestamp-translate timestamp)))
  331. (defun org-rss-plain-text (contents info)
  332. "Convert plain text into RSS encoded text."
  333. (let (output)
  334. (setq output (org-html-encode-plain-text contents)
  335. output (org-export-activate-smart-quotes
  336. output :html info))))
  337. ;;; Filters
  338. (defun org-rss-final-function (contents backend info)
  339. "Prettify the RSS output."
  340. (with-temp-buffer
  341. (xml-mode)
  342. (insert contents)
  343. (indent-region (point-min) (point-max))
  344. (buffer-substring-no-properties (point-min) (point-max))))
  345. ;;; Miscellaneous
  346. (defun org-rss-add-pubdate-property ()
  347. "Set the PUBDATE property for top-level headlines."
  348. (let (msg)
  349. (org-map-entries
  350. (lambda ()
  351. (let* ((entry (org-element-at-point))
  352. (level (org-element-property :level entry)))
  353. (when (= level 1)
  354. (unless (org-entry-get (point) "PUBDATE")
  355. (setq msg t)
  356. (org-set-property
  357. "PUBDATE" (format-time-string
  358. (cdr org-time-stamp-formats)))))))
  359. nil nil 'comment 'archive)
  360. (when msg
  361. (message "Property PUBDATE added to top-level entries in %s"
  362. (buffer-file-name))
  363. (sit-for 2))))
  364. (provide 'ox-rss)
  365. ;;; ox-rss.el ends here