ol-w3m.el 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224
  1. ;;; ol-w3m.el --- Copy and Paste From W3M -*- lexical-binding: t; -*-
  2. ;; Copyright (C) 2008-2022 Free Software Foundation, Inc.
  3. ;; Author: Andy Stewart <lazycat dot manatee at gmail dot com>
  4. ;; Keywords: outlines, hypermedia, calendar, wp
  5. ;; URL: https://orgmode.org
  6. ;;
  7. ;; This file is part of GNU Emacs.
  8. ;; GNU Emacs is free software: you can redistribute it and/or modify
  9. ;; it under the terms of the GNU General Public License as published by
  10. ;; the Free Software Foundation, either version 3 of the License, or
  11. ;; (at your option) any later version.
  12. ;; GNU Emacs is distributed in the hope that it will be useful,
  13. ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. ;; GNU General Public License for more details.
  16. ;; You should have received a copy of the GNU General Public License
  17. ;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
  18. ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
  19. ;;
  20. ;;; Commentary:
  21. ;; This file implements copying HTML content from a w3m buffer and
  22. ;; transforming the text on the fly so that it can be pasted into an
  23. ;; Org buffer with hot links. It will also work for regions in gnus
  24. ;; buffers that have been washed with w3m.
  25. ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
  26. ;;
  27. ;;; Acknowledgments:
  28. ;; Richard Riley <rileyrgdev at googlemail dot com>
  29. ;;
  30. ;; The idea of transforming the HTML content with Org syntax is
  31. ;; proposed by Richard, I'm just coding it.
  32. ;;
  33. ;;; Code:
  34. (require 'org-macs)
  35. (org-assert-version)
  36. (require 'ol)
  37. (defvar w3m-current-url)
  38. (defvar w3m-current-title)
  39. (org-link-set-parameters "w3m" :store #'org-w3m-store-link)
  40. (defun org-w3m-store-link ()
  41. "Store a link to a w3m buffer."
  42. (when (eq major-mode 'w3m-mode)
  43. (org-link-store-props
  44. :type "w3m"
  45. :link w3m-current-url
  46. :url (url-view-url t)
  47. :description (or w3m-current-title w3m-current-url))))
  48. (defun org-w3m-copy-for-org-mode ()
  49. "Copy current buffer content or active region with Org style links.
  50. This will encode `link-title' and `link-location' with
  51. `org-link-make-string', and insert the transformed test into the kill ring,
  52. so that it can be yanked into an Org buffer with links working correctly."
  53. (interactive)
  54. (let* ((regionp (org-region-active-p))
  55. (transform-start (point-min))
  56. (transform-end (point-max))
  57. return-content
  58. link-location link-title
  59. temp-position out-bound)
  60. (when regionp
  61. (setq transform-start (region-beginning))
  62. (setq transform-end (region-end))
  63. ;; Deactivate mark if current mark is activate.
  64. (deactivate-mark))
  65. (message "Transforming links...")
  66. (save-excursion
  67. (goto-char transform-start)
  68. (while (and (not out-bound) ; still inside region to copy
  69. (not (org-w3m-no-next-link-p))) ; no next link current buffer
  70. ;; store current point before jump next anchor
  71. (setq temp-position (point))
  72. ;; move to next anchor when current point is not at anchor
  73. (or (get-text-property (point) 'w3m-href-anchor) (org-w3m-get-next-link-start))
  74. (cond
  75. ((<= (point) transform-end) ; point is inside transform bound
  76. ;; get content between two links.
  77. (when (> (point) temp-position)
  78. (setq return-content (concat return-content
  79. (buffer-substring
  80. temp-position (point)))))
  81. (cond
  82. ((setq link-location (get-text-property (point) 'w3m-href-anchor))
  83. ;; current point is a link
  84. ;; (we thus also got link location at current point)
  85. ;; get link title at current point.
  86. (setq link-title (buffer-substring (point)
  87. (org-w3m-get-anchor-end)))
  88. ;; concat Org style url to `return-content'.
  89. (setq return-content
  90. (concat return-content
  91. (if (org-string-nw-p link-location)
  92. (org-link-make-string link-location link-title)
  93. link-title))))
  94. ((setq link-location (get-text-property (point) 'w3m-image))
  95. ;; current point is an image
  96. ;; (we thus also got image link location at current point)
  97. ;; get link title at current point.
  98. (setq link-title (buffer-substring (point) (org-w3m-get-image-end)))
  99. ;; concat Org style url to `return-content'.
  100. (setq return-content
  101. (concat return-content
  102. (if (org-string-nw-p link-location)
  103. (org-link-make-string link-location link-title)
  104. link-title))))
  105. (t nil))); current point is neither a link nor an image
  106. (t ; point is NOT inside transform bound
  107. (goto-char temp-position) ; reset point before jump next anchor
  108. (setq out-bound t)))) ; for break out `while' loop
  109. ;; add the rest until end of the region to be copied
  110. (when (< (point) transform-end)
  111. (setq return-content
  112. (concat return-content
  113. (buffer-substring (point) transform-end))))
  114. (org-kill-new return-content)
  115. (message "Transforming links...done, use C-y to insert text into Org file")
  116. (message "Copy with link transformation complete."))))
  117. (defun org-w3m-get-anchor-start ()
  118. "Move cursor to the start of current anchor. Return point."
  119. ;; get start position of anchor or current point
  120. ;; NOTE: This function seems never to be used. Should it be removed?
  121. (goto-char (or (previous-single-property-change (point) 'w3m-anchor-sequence)
  122. (point))))
  123. (defun org-w3m-get-anchor-end ()
  124. "Move cursor to the end of current anchor. Return point."
  125. ;; get end position of anchor or point
  126. (goto-char (or (next-single-property-change (point) 'w3m-anchor-sequence)
  127. (point))))
  128. (defun org-w3m-get-image-end ()
  129. "Move cursor to the end of current image. Return point."
  130. ;; get end position of image or point
  131. ;; NOTE: Function `org-w3m-get-image-start' was not created because
  132. ;; function `org-w3m-get-anchor-start' is never used.
  133. (goto-char (or (next-single-property-change (point) 'w3m-image)
  134. (point))))
  135. (defun org-w3m-get-next-link-start ()
  136. "Move cursor to the start of next link or image. Return point."
  137. (let (pos start-pos anchor-pos image-pos)
  138. (setq pos (setq start-pos (point)))
  139. (setq anchor-pos
  140. (catch 'reach
  141. (while (setq pos (next-single-property-change pos 'w3m-anchor-sequence))
  142. (when (get-text-property pos 'w3m-href-anchor)
  143. (throw 'reach pos)))))
  144. (setq pos start-pos)
  145. (setq image-pos
  146. (catch 'reach
  147. (while (setq pos (next-single-property-change pos 'w3m-image))
  148. (when (get-text-property pos 'w3m-image)
  149. (throw 'reach pos)))))
  150. (goto-char (min (or anchor-pos (point-max)) (or image-pos (point-max))))))
  151. (defun org-w3m-get-prev-link-start ()
  152. "Move cursor to the start of previous link. Return point."
  153. ;; NOTE: This function is only called by `org-w3m-no-prev-link-p',
  154. ;; which itself seems never to be used. Should it be removed?
  155. ;;
  156. ;; WARNING: This function has not been updated to account for
  157. ;; `w3m-image'. See `org-w3m-get-next-link-start'.
  158. (catch 'reach
  159. (let ((pos (point)))
  160. (while (setq pos (previous-single-property-change pos 'w3m-anchor-sequence))
  161. (when (get-text-property pos 'w3m-href-anchor)
  162. ;; jump to previous anchor
  163. (goto-char pos)
  164. ;; return point when current is valid link
  165. (throw 'reach nil)))))
  166. (point))
  167. (defun org-w3m-no-next-link-p ()
  168. "Whether there is no next link after the cursor.
  169. Return t if there is no next link; otherwise, return nil."
  170. (save-excursion
  171. (equal (point) (org-w3m-get-next-link-start))))
  172. (defun org-w3m-no-prev-link-p ()
  173. "Whether there is no previous link after the cursor.
  174. Return t if there is no previous link; otherwise, return nil."
  175. ;; NOTE: This function seems never to be used. Should it be removed?
  176. (save-excursion
  177. (equal (point) (org-w3m-get-prev-link-start))))
  178. ;; Install keys into the w3m keymap
  179. (defvar w3m-mode-map)
  180. (defvar w3m-minor-mode-map)
  181. (when (and (boundp 'w3m-mode-map)
  182. (keymapp w3m-mode-map))
  183. (define-key w3m-mode-map "\C-c\C-x\M-w" 'org-w3m-copy-for-org-mode)
  184. (define-key w3m-mode-map "\C-c\C-x\C-w" 'org-w3m-copy-for-org-mode))
  185. (when (and (boundp 'w3m-minor-mode-map)
  186. (keymapp w3m-minor-mode-map))
  187. (define-key w3m-minor-mode-map "\C-c\C-x\M-w" 'org-w3m-copy-for-org-mode)
  188. (define-key w3m-minor-mode-map "\C-c\C-x\C-w" 'org-w3m-copy-for-org-mode))
  189. (add-hook
  190. 'w3m-mode-hook
  191. (lambda ()
  192. (define-key w3m-mode-map "\C-c\C-x\M-w" 'org-w3m-copy-for-org-mode)
  193. (define-key w3m-mode-map "\C-c\C-x\C-w" 'org-w3m-copy-for-org-mode)))
  194. (add-hook
  195. 'w3m-minor-mode-hook
  196. (lambda ()
  197. (define-key w3m-minor-mode-map "\C-c\C-x\M-w" 'org-w3m-copy-for-org-mode)
  198. (define-key w3m-minor-mode-map "\C-c\C-x\C-w" 'org-w3m-copy-for-org-mode)))
  199. (provide 'ol-w3m)
  200. ;;; ol-w3m.el ends here